adding kustomization

2025-09-13 11:44:13 -04:00
parent 469dfcd094
commit a4952581ec
17 changed files with 381 additions and 2 deletions
@@ -7,6 +7,8 @@ spec:
    destinations:
        - server: https://kubernetes.default.svc
          namespace: ai
        - server: https://kubernetes.default.svc
          namespace: argo
        # # only add if need to deploy into argocd (ehhhhh)
        # - server: https://kubernetes.default.svc
        #   namespace: argocd
@@ -27,8 +29,6 @@ spec:
        repoURL: https://git.ion606.com/ion606/ollama-plus
        targetRevision: argo
        path: apps/children
        directory:
            recurse: true
    syncPolicy:
        automated:
            prune: true
@@ -0,0 +1,18 @@
 apiVersion: argoproj.io/v1alpha1
 kind: Application
 metadata:
    name: argo-templates
    namespace: ai
 spec:
    project: ai-stack
    destination:
        server: https://kubernetes.default.svc
        namespace: argo
    source:
        repoURL: https://git.ion606.com/ion606/ollama-plus
        targetRevision: main
        path: apps/argo-templates
    syncPolicy:
        automated:
            prune: true
            selfHeal: true
@@ -0,0 +1,20 @@
 apiVersion: argoproj.io/v1alpha1
 kind: Application
 metadata:
    name: ollama-scheduler
    namespace: ai
    labels:
        repo.ion606.com/ollama-plus: "true"
 spec:
    project: ai-stack
    destination:
        server: https://kubernetes.default.svc
        namespace: argo
    source:
        repoURL: https://git.ion606.com/ion606/ollama-plus
        targetRevision: main
        path: manifests/argo-ollama-scheduler
    syncPolicy:
        automated:
            prune: true
            selfHeal: true
@@ -3,6 +3,8 @@ kind: Application
 metadata:
    name: coderunner
    namespace: ai
    labels:
        repo.ion606.com/ollama-plus: "true"
 spec:
    project: ai-stack
    destination:
@@ -0,0 +1,35 @@
 apiVersion: kustomize.config.k8s.io/v1beta1
 kind: Kustomization
 resources:
    - argo-ollama-scheduler.yaml
    - coderunner.yaml
    - tools.yaml
    - rag-server.yaml
    - openwebui.yaml
    - postgresql.yaml
    - searxng.yaml
    - browser.yaml
 generatorOptions:
    disableNameSuffixHash: true
 configMapGenerator:
    - name: ollama-plus-revs
      literals:
          - targetRevision=main
 # Inject targetRevision from the ConfigMap into apps (kill me)
 replacements:
    - source:
          kind: ConfigMap
          name: ollama-plus-revs
          fieldPath: data.targetRevision
      targets:
          - select:
                kind: Application
                labelSelector: repo.ion606.com/ollama-plus=true
            fieldPaths:
                - spec.source.targetRevision
            options:
                create: true
@@ -3,6 +3,8 @@ kind: Application
 metadata:
    name: rag-server
    namespace: ai
    labels:
        repo.ion606.com/ollama-plus: "true"
 spec:
    project: ai-stack
    destination:
@@ -3,6 +3,8 @@ kind: Application
 metadata:
    name: tools
    namespace: ai
    labels:
        repo.ion606.com/ollama-plus: "true"
 spec:
    project: ai-stack
    destination:
@@ -0,0 +1,46 @@
 apiVersion: apps/v1
 kind: Deployment
 metadata:
  name: schedules-api
  namespace: argo
 spec:
  replicas: 1
  selector:
    matchLabels: { app: schedules-api }
  template:
    metadata:
      labels: { app: schedules-api }
    spec:
      serviceAccountName: schedules-api
      containers:
        - name: schedules-api
          # TODO: build & push your image, then update below
          image: ghcr.io/your-org/schedules-api:0.1.0
          imagePullPolicy: IfNotPresent
          env:
            - { name: PORT, value: "3000" }
            - { name: NS, value: "argo" }
          ports:
            - { name: http, containerPort: 3000 }
          readinessProbe:
            tcpSocket: { port: 3000 }
            initialDelaySeconds: 3
            periodSeconds: 10
          livenessProbe:
            tcpSocket: { port: 3000 }
            initialDelaySeconds: 10
            periodSeconds: 20
          resources:
            requests: { cpu: "50m", memory: "64Mi" }
            limits: { cpu: "200m", memory: "256Mi" }
 ---
 apiVersion: v1
 kind: Service
 metadata:
  name: schedules-api
  namespace: argo
 spec:
  selector: { app: schedules-api }
  ports:
    - { name: http, port: 3000, targetPort: 3000 }
  type: ClusterIP
@@ -0,0 +1,47 @@
 apiVersion: v1
 kind: ServiceAccount
 metadata:
  name: schedules-api
  namespace: argo
 ---
 apiVersion: rbac.authorization.k8s.io/v1
 kind: Role
 metadata:
  name: schedules-api
  namespace: argo
 rules:
  - apiGroups: ["argoproj.io"]
    resources: ["cronworkflows"]
    verbs: ["create","get","list","watch","update","patch","delete"]
  - apiGroups: ["argoproj.io"]
    resources: ["workflows"]
    verbs: ["create","get","list"]
  - apiGroups: ["argoproj.io"]
    resources: ["workflowtemplates"]
    verbs: ["get","list"]
 ---
 # If you need ClusterWorkflowTemplate support, create this ClusterRole and a ClusterRoleBinding
 # with subject serviceAccountName: schedules-api, namespace: argo
 # apiVersion: rbac.authorization.k8s.io/v1
 # kind: ClusterRole
 # metadata:
 #   name: schedules-api-cwft-read
 # rules:
 #   - apiGroups: ["argoproj.io"]
 #     resources: ["clusterworkflowtemplates"]
 #     verbs: ["get","list"]
 ---
 apiVersion: rbac.authorization.k8s.io/v1
 kind: RoleBinding
 metadata:
  name: schedules-api
  namespace: argo
 subjects:
  - kind: ServiceAccount
    name: schedules-api
    namespace: argo
 roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: Role
  name: schedules-api
@@ -0,0 +1,17 @@
 apiVersion: argoproj.io/v1alpha1
 kind: WorkflowTemplate
 metadata:
  name: hello-template
  namespace: argo
 spec:
  entrypoint: run
  arguments:
    parameters:
      - { name: message, value: "hello from argo" }
  templates:
    - name: run
      container:
        image: alpine:3.19
        command: ["/bin/sh","-lc"]
        args: ["echo \"{{workflow.parameters.message}}\""]
@@ -0,0 +1,27 @@
 apiVersion: argoproj.io/v1alpha1
 kind: WorkflowTemplate
 metadata:
  name: ollama-job-template
  namespace: argo
 spec:
  entrypoint: run
  arguments:
    parameters:
      - { name: task, value: "quick-check" }
      - { name: prompt, value: "reindex embeddings" }
  templates:
    - name: run
      container:
        # Replace with an image that can reach your Ollama endpoint
        image: curlimages/curl:8.9.0
        command: ["/bin/sh","-lc"]
        args:
          - >-
            echo "task: {{workflow.parameters.task}}";
            echo "prompt: {{workflow.parameters.prompt}}";
            # Example call (adjust host/port or service DNS):
            # curl -s http://ollama.ai.svc.cluster.local:11434/api/generate \
            #   -H 'content-type: application/json' \
            #   -d '{"model":"llama3.1","prompt":"{{workflow.parameters.prompt}}"}' | tee /tmp/out.json;
            echo done.
@@ -0,0 +1,6 @@
 node_modules
 npm-cache
 bun.lockb
 .DS_Store
 *.log
@@ -0,0 +1,14 @@
 FROM oven/bun:1 as base
 WORKDIR /app
 # prod deps
 COPY package.json ./package.json
 RUN bun install --ci --production
 COPY server.mjs ./server.mjs
 USER bun
 EXPOSE 3000
 ENV NODE_ENV=production
 CMD ["bun", "run", "server.mjs"]
@@ -0,0 +1,14 @@
 {
  "name": "schedules-api",
  "version": "0.1.0",
  "private": true,
  "type": "module",
  "scripts": {
    "start": "bun run server.mjs",
    "dev": "bun run --hot server.mjs"
  },
  "dependencies": {
    "@kubernetes/client-node": "^0.22.1"
  }
 }
@@ -0,0 +1,123 @@
 // bun run server.mjs
 // tiny schedules api to manage argo cronworkflows/workflows via k8s CRDs
 // comments intentionally lowercase per original style
 import http from 'http'
 import { KubeConfig, CustomObjectsApi } from '@kubernetes/client-node'
 const GROUP = 'argoproj.io'
 const VERSION = 'v1alpha1'
 const CRON_PLURAL = 'cronworkflows'
 const WF_PLURAL = 'workflows'
 const NAMESPACE = process.env.NS || 'argo'
 // load cluster credentials (or fallback to local kubeconfig for dev)
 const kc = new KubeConfig()
 try { kc.loadFromCluster() } catch { kc.loadFromDefault() }
 const co = kc.makeApiClient(CustomObjectsApi)
 // helper: build cron string from an iso timestamp in a tz
 const cronFromISO = (iso, tz = 'America/New_York') => {
  const dt = new Date(iso)
  const parts = new Intl.DateTimeFormat('en-US', {
    timeZone: tz, year: 'numeric', month: 'numeric', day: 'numeric',
    hour: 'numeric', minute: '2-digit', hour12: false
  }).formatToParts(dt).reduce((a, p) => (a[p.type] = p.value, a), {})
  const m = Number(parts.month), d = Number(parts.day), h = Number(parts.hour), min = Number(parts.minute)
  return `${min} ${h} ${d} ${m} *`
 }
 // create or update a cronworkflow that runs a workflowtemplate
 async function upsertCronWorkflow({
  name, when, tz = 'America/New_York', oneShot = false,
  template = { name: '', clusterScope: false },
  parameters = {}, entrypoint
 }) {
  const schedule = when.cron ?? cronFromISO(when.iso, tz)
  const args = Object.entries(parameters).map(([name, value]) => ({ name, value }))
  const body = {
    apiVersion: `${GROUP}/${VERSION}`,
    kind: 'CronWorkflow',
    metadata: { name },
    spec: {
      timezone: tz,
      schedules: [schedule],
      concurrencyPolicy: 'Forbid',
      ...(oneShot ? { stopStrategy: { expression: 'cronworkflow.succeeded >= 1' } } : {}),
      workflowSpec: {
        ...(entrypoint ? { entrypoint } : {}),
        arguments: args.length ? { parameters: args } : undefined,
        workflowTemplateRef: {
          name: template.name,
          ...(template.clusterScope ? { clusterScope: true } : {})
        }
      }
    }
  }
  // try patch, else create
  try {
    await co.patchNamespacedCustomObject(
      GROUP, VERSION, NAMESPACE, CRON_PLURAL, name, body,
      undefined, undefined, undefined,
      { headers: { 'content-type': 'application/merge-patch+json' } }
    )
  } catch {
    await co.createNamespacedCustomObject(GROUP, VERSION, NAMESPACE, CRON_PLURAL, body)
  }
 }
 // run immediately (no schedule) by creating a workflow from the same template
 async function runNow({ name, template, parameters = {}, entrypoint }) {
  const args = Object.entries(parameters).map(([name, value]) => ({ name, value }))
  const wf = {
    apiVersion: `${GROUP}/${VERSION}`,
    kind: 'Workflow',
    metadata: { generateName: `${name}-` },
    spec: {
      ...(entrypoint ? { entrypoint } : {}),
      arguments: args.length ? { parameters: args } : undefined,
      workflowTemplateRef: {
        name: template.name,
        ...(template.clusterScope ? { clusterScope: true } : {})
      }
    }
  }
  await co.createNamespacedCustomObject(GROUP, VERSION, NAMESPACE, WF_PLURAL, wf)
 }
 // tiny http api
 const server = http.createServer(async (req, res) => {
  try {
    if (req.method === 'POST' && req.url === '/schedules') {
      const input = JSON.parse(await new Promise(r => {
        let d = ''; req.on('data', c => d += c); req.on('end', () => r(d))
      }))
      await upsertCronWorkflow(input)
      res.writeHead(201).end(JSON.stringify({ ok: true }))
      return
    }
    if (req.method === 'POST' && req.url === '/run-now') {
      const input = JSON.parse(await new Promise(r => {
        let d = ''; req.on('data', c => d += c); req.on('end', () => r(d))
      }))
      await runNow(input)
      res.writeHead(201).end(JSON.stringify({ ok: true }))
      return
    }
    if (req.method === 'DELETE' && req.url?.startsWith('/schedules/')) {
      const name = decodeURIComponent(req.url.split('/').pop())
      await co.deleteNamespacedCustomObject(GROUP, VERSION, NAMESPACE, CRON_PLURAL, name)
      res.writeHead(204).end()
      return
    }
    res.writeHead(404).end('not found')
  } catch (e) {
    res.writeHead(500).end(JSON.stringify({ ok: false, error: e.message }))
  }
 })
 const port = Number(process.env.PORT) || 3000
 server.listen(port, () => console.log(`schedules api listening on :${port}`))
@@ -13,3 +13,7 @@ docker push ion606/rag-server:latest;
 # tools
 docker build -t ion606/tools:latest ./tools;
 docker push ion606/tools:latest;
 # scheduling
 docker build -t ion606/ollama-scheduler:latest ./scheduler;
 docker push ion606/ollama-scheduler:latest;
@@ -12,6 +12,8 @@ minikube addons enable ingress-dns;
 # namespaces
 kubectl create namespace argocd --dry-run=client -o yaml | kubectl apply -f -;
 kubectl create namespace ai --dry-run=client -o yaml | kubectl apply -f -;
 # argo workflows namespace (for cronworkflows/workflows + templates)
 kubectl create namespace argo --dry-run=client -o yaml | kubectl apply -f -;
 # install argo cd (stable manifest)
 # https://argo-cd.readthedocs.io/en/stable/operator-manual/installation/