theshire/kubernetes/apps/ai/ollama/app/helmrelease.yaml

---
# yaml-language-server: $schema=https://raw.githubusercontent.com/bjw-s/helm-charts/main/charts/other/app-template/schemas/helmrelease-helm-v2beta2.schema.json
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: &app ollama
spec:
  interval: 30m
  chart:
    spec:
      chart: app-template
      version: 3.5.1
      sourceRef:
        kind: HelmRepository
        name: bjw-s
        namespace: flux-system
  install:
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    remediation:
      retries: 3
      strategy: rollback
  values:
    controllers:
      ollama:
        annotations:
          reloader.stakater.com/auto: "true"
        pod:
          nodeSelector:
            nvidia.com/gpu.present: "true"
          runtimeClassName: nvidia
        containers:
          app:
            image:
              repository: docker.io/ollama/ollama
              tag: 0.3.12
            env:
              - name: OLLAMA_HOST
                value: 0.0.0.0
              - name: OLLAMA_ORIGINS
                value: "*"
              - name: OLLAMA_MODELS
                value: &modelPath "/models"
              - name: OLLAMA_KEEP_ALIVE
                value: "24h"
            resources:
              requests:
                nvidia.com/gpu: 1 # requesting 1 GPU
                cpu: 500m
                memory: 2Gi
              limits:
                memory: 16Gi
                nvidia.com/gpu: 1 # requesting 1 GPU
    service:
      app:
        controller: ollama
        ports:
          http:
            port: 11434
    ingress:
      app:
        enabled: true
        className: internal-nginx
        hosts:
          - host: &host "{{ .Release.Name }}.jahanson.tech"
            paths:
              - path: /
                service:
                  identifier: app
                  port: http
        tls:
          - hosts:
              - *host
    persistence:
      models:
        enabled: true
        existingClaim: ollama-models
        advancedMounts:
          ollama:
            app:
              - path: *modelPath
      config:
        enabled: true
        existingClaim: ollama
        globalMounts:
          - path: /root/.ollama