Compare commits

...

24 commits

Author SHA1 Message Date
28c98bb835 Update docker.io/ollama/ollama Docker tag to v0.2.7 2024-07-18 20:32:13 +00:00
47629d98e4
MOAR! 2024-07-18 13:50:21 -05:00
7c13632d90
all the way up 2024-07-18 13:39:28 -05:00
ad56cff785
Update mount paths. 2024-07-18 12:50:55 -05:00
62a468c65d
reloader and single strat 2024-07-18 11:45:40 -05:00
9e2843db6d
update values vs config 2024-07-18 11:38:59 -05:00
3164ed8cc3
mixed 2024-07-18 11:01:06 -05:00
3c7fc961e2
multiple gpu apps per card 2024-07-18 10:54:49 -05:00
9a5dd3b499
Add Stable Diffusion - ComfyUI 2024-07-18 10:33:15 -05:00
09bb62a3eb
Update. 2024-07-17 19:24:54 -05:00
5de65b8feb
Update settings for websearch. 2024-07-17 19:06:23 -05:00
b6fca7d5f9
Update deprecated plugin 2024-07-17 18:52:21 -05:00
7a641c2484
disable limiter. 2024-07-17 18:26:23 -05:00
abc80d9e74
reduce settings 2024-07-17 18:24:12 -05:00
9a5876dc3f
add pod network 2024-07-17 18:14:10 -05:00
826d7f5c23
Add websearch to open-webui. 2024-07-17 18:07:08 -05:00
18196d4a64
forgot to include secret 2024-07-17 17:06:03 -05:00
e42c8bc664
no string? 2024-07-17 17:04:39 -05:00
ce3e10c530
Correct file extension. 2024-07-17 17:02:49 -05:00
83db39c83f
Add Searxng. 2024-07-17 17:00:17 -05:00
e9dae245c7
Add privileged movers 2024-07-17 16:08:43 -05:00
6633145379
update base url 2024-07-17 15:03:14 -05:00
3ebcf13282
Add Open-WebUI for AI chat. 2024-07-17 14:54:16 -05:00
09642a8de9
Lets keep those models loaded for a bit longer. 2024-07-17 14:10:25 -05:00
20 changed files with 512 additions and 15 deletions

View file

@ -7,3 +7,5 @@ resources:
- ./namespace.yaml - ./namespace.yaml
# Flux-Kustomizations # Flux-Kustomizations
- ./ollama/ks.yaml - ./ollama/ks.yaml
- ./open-webui/ks.yaml
- ./stable-diffusion/ks.yaml

View file

@ -5,3 +5,4 @@ metadata:
name: ai name: ai
labels: labels:
kustomize.toolkit.fluxcd.io/prune: disabled kustomize.toolkit.fluxcd.io/prune: disabled
volsync.backube/privileged-movers: "true"

View file

@ -35,7 +35,7 @@ spec:
app: app:
image: image:
repository: docker.io/ollama/ollama repository: docker.io/ollama/ollama
tag: 0.2.5 tag: 0.2.7
env: env:
- name: OLLAMA_HOST - name: OLLAMA_HOST
value: 0.0.0.0 value: 0.0.0.0
@ -43,6 +43,8 @@ spec:
value: "*" value: "*"
- name: OLLAMA_MODELS - name: OLLAMA_MODELS
value: &modelPath "/models" value: &modelPath "/models"
- name: OLLAMA_KEEP_ALIVE
value: "24h"
resources: resources:
requests: requests:
nvidia.com/gpu: 1 # requesting 1 GPU nvidia.com/gpu: 1 # requesting 1 GPU

View file

@ -0,0 +1,77 @@
---
# yaml-language-server: $schema=https://raw.githubusercontent.com/bjw-s/helm-charts/main/charts/other/app-template/schemas/helmrelease-helm-v2beta2.schema.json
# Flux HelmRelease that deploys Open WebUI through the bjw-s app-template chart.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: &app open-webui
spec:
  interval: 30m
  chart:
    spec:
      chart: app-template
      version: 3.2.1
      sourceRef:
        kind: HelmRepository
        name: bjw-s
        namespace: flux-system
  # Reconcile only after the ollama HelmRelease, which serves OLLAMA_BASE_URL.
  dependsOn:
    - name: ollama
  install:
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    remediation:
      retries: 3
      strategy: rollback
  values:
    controllers:
      open-webui:
        annotations:
          reloader.stakater.com/auto: "true"
        containers:
          app:
            image:
              repository: ghcr.io/open-webui/open-webui
              tag: git-82079e6
            env:
              - name: OLLAMA_BASE_URL
                value: http://ollama.ai.svc.cluster.local:11434
              # Env values must be strings; a bare `true` parses as a YAML
              # boolean, so it is quoted.
              - name: ENABLE_RAG_WEB_SEARCH
                value: "true"
              - name: RAG_WEB_SEARCH_ENGINE
                value: searxng
              # Quoted because the URL carries `?`, `<` and `>`; `<query>` is
              # passed through literally.
              - name: SEARXNG_QUERY_URL
                value: "http://searxng.default.svc.cluster.local:8080/search?q=<query>"
            resources:
              requests:
                cpu: 500m
                memory: 2Gi
              limits:
                memory: 2Gi
    service:
      app:
        controller: open-webui
        ports:
          http:
            port: 8080
    ingress:
      app:
        enabled: true
        className: internal-nginx
        hosts:
          - host: &host "chat.jahanson.tech"
            paths:
              - path: /
                service:
                  identifier: app
                  port: http
        tls:
          - hosts:
              - *host
    persistence:
      config:
        enabled: true
        # Claim name follows the release name (alias of metadata.name).
        existingClaim: *app
        globalMounts:
          - path: /app/backend/data

View file

@ -0,0 +1,7 @@
---
# yaml-language-server: $schema=https://json.schemastore.org/kustomization
# Kustomize entry point for Open WebUI: the HelmRelease plus the shared
# volsync template directory.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization
resources:
  - ./helmrelease.yaml
  - ../../../../templates/volsync

View file

@ -0,0 +1,28 @@
---
# yaml-language-server: $schema=https://ks.hsn.dev/kustomize.toolkit.fluxcd.io/kustomization_v1.json
# Flux Kustomization that applies ./kubernetes/apps/ai/open-webui/app from the
# homelab GitRepository into the `ai` namespace.
apiVersion: kustomize.toolkit.fluxcd.io/v1
kind: Kustomization
metadata:
  name: &app open-webui
  namespace: flux-system
spec:
  targetNamespace: ai
  commonMetadata:
    labels:
      app.kubernetes.io/name: *app
  dependsOn:
    - name: volsync
    - name: ollama
  path: ./kubernetes/apps/ai/open-webui/app
  prune: true
  sourceRef:
    kind: GitRepository
    name: homelab
  wait: false
  interval: 30m
  retryInterval: 1m
  timeout: 5m
  postBuild:
    # Substituted into the rendered manifests; presumably consumed by the
    # volsync template referenced from the app kustomization — confirm.
    substitute:
      APP: *app
      VOLSYNC_CAPACITY: 5Gi

View file

@ -0,0 +1,82 @@
---
# yaml-language-server: $schema=https://raw.githubusercontent.com/bjw-s/helm-charts/main/charts/other/app-template/schemas/helmrelease-helm-v2beta2.schema.json
# Flux HelmRelease that deploys ComfyUI (Stable Diffusion) through the bjw-s
# app-template chart on a GPU node.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: &app comfyui
spec:
  interval: 30m
  chart:
    spec:
      chart: app-template
      version: 3.2.1
      sourceRef:
        kind: HelmRepository
        name: bjw-s
        namespace: flux-system
  install:
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    remediation:
      retries: 3
      strategy: rollback
  values:
    controllers:
      comfyui:
        annotations:
          reloader.stakater.com/auto: "true"
        pod:
          # Schedule only on nodes labelled as having an NVIDIA GPU and run
          # under the nvidia runtime class.
          nodeSelector:
            nvidia.com/gpu.present: "true"
          runtimeClassName: nvidia
        containers:
          app:
            image:
              repository: docker.io/jahanson/comfyui
              tag: v0.0.1
            resources:
              requests:
                nvidia.com/gpu: 1 # requesting 1 GPU
                cpu: 500m
                memory: 2Gi
              limits:
                memory: 60Gi
                # Extended-resource limit; kept equal to the request above.
                nvidia.com/gpu: 1
    service:
      app:
        controller: comfyui
        ports:
          http:
            port: 7860
    ingress:
      app:
        enabled: true
        className: internal-nginx
        hosts:
          # Host is templated from the Helm release name.
          - host: &host "{{ .Release.Name }}.jahanson.tech"
            paths:
              - path: /
                service:
                  identifier: app
                  port: http
        tls:
          - hosts:
              - *host
    persistence:
      models:
        enabled: true
        existingClaim: stablediffusion-checkpoints
        globalMounts:
          - path: /data/models
      config:
        enabled: true
        existingClaim: comfyui
        globalMounts:
          - path: /data/config
      output:
        enabled: true
        # emptyDir: contents do not survive pod replacement.
        type: emptyDir
        globalMounts:
          - path: /output

View file

@ -0,0 +1,8 @@
---
# yaml-language-server: $schema=https://json.schemastore.org/kustomization
# Kustomize entry point for ComfyUI: the HelmRelease, the checkpoints PVC and
# the shared volsync template directory.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization
resources:
  - ./helmrelease.yaml
  - ./pvc.yaml
  - ../../../../templates/volsync

View file

@ -0,0 +1,12 @@
---
# 300Gi ReadWriteOnce claim on the openebs-hostpath storage class.
apiVersion: v1
kind: PersistentVolumeClaim
metadata:
  name: stablediffusion-checkpoints
spec:
  accessModes:
    - ReadWriteOnce
  resources:
    requests:
      storage: 300Gi
  storageClassName: openebs-hostpath

View file

@ -0,0 +1,30 @@
---
# yaml-language-server: $schema=https://ks.hsn.dev/kustomize.toolkit.fluxcd.io/kustomization_v1.json
# Flux Kustomization that applies ./kubernetes/apps/ai/stable-diffusion/comfyui
# from the homelab GitRepository into the `ai` namespace.
apiVersion: kustomize.toolkit.fluxcd.io/v1
kind: Kustomization
metadata:
  name: &app comfyui
  namespace: flux-system
spec:
  targetNamespace: ai
  commonMetadata:
    labels:
      app.kubernetes.io/name: *app
  dependsOn:
    - name: nvidia-device-plugin
    - name: node-feature-discovery
    - name: volsync
    - name: openebs
  path: ./kubernetes/apps/ai/stable-diffusion/comfyui
  prune: true
  sourceRef:
    kind: GitRepository
    name: homelab
  wait: false
  interval: 30m
  retryInterval: 1m
  timeout: 5m
  postBuild:
    # Substituted into the rendered manifests; presumably consumed by the
    # volsync template referenced from the app kustomization — confirm.
    substitute:
      APP: *app
      VOLSYNC_CAPACITY: 5Gi

View file

@ -13,6 +13,7 @@ resources:
- ./radarr/ks.yaml - ./radarr/ks.yaml
- ./recyclarr/ks.yaml - ./recyclarr/ks.yaml
- ./sabnzbd/ks.yaml - ./sabnzbd/ks.yaml
- ./searxng/ks.yaml
- ./sonarr/ks.yaml - ./sonarr/ks.yaml
- ./tautulli/ks.yaml - ./tautulli/ks.yaml
- ./unpackerr/ks.yaml - ./unpackerr/ks.yaml

View file

@ -0,0 +1,19 @@
---
# yaml-language-server: $schema=https://ks.hsn.dev/external-secrets.io/externalsecret_v1beta1.json
# ExternalSecret that renders the `searxng-secret` Secret from the `searxng`
# item in the onepassword-connect ClusterSecretStore.
apiVersion: external-secrets.io/v1beta1
kind: ExternalSecret
metadata:
  name: searxng
spec:
  secretStoreRef:
    kind: ClusterSecretStore
    name: onepassword-connect
  target:
    name: searxng-secret
    template:
      engineVersion: v2
      data:
        SEARXNG_SECRET: "{{ .SEARXNG_SECRET }}"
  dataFrom:
    - extract:
        key: searxng

View file

@ -0,0 +1,112 @@
---
# yaml-language-server: $schema=https://raw.githubusercontent.com/bjw-s/helm-charts/main/charts/other/app-template/schemas/helmrelease-helm-v2beta2.schema.json
# Flux HelmRelease that deploys SearXNG through the bjw-s app-template chart.
apiVersion: helm.toolkit.fluxcd.io/v2
kind: HelmRelease
metadata:
  name: searxng
spec:
  interval: 30m
  chart:
    spec:
      chart: app-template
      version: 3.2.1
      sourceRef:
        kind: HelmRepository
        name: bjw-s
        namespace: flux-system
  install:
    remediation:
      retries: 3
  upgrade:
    cleanupOnFail: true
    remediation:
      retries: 3
      strategy: rollback
  values:
    controllers:
      searxng:
        annotations:
          reloader.stakater.com/auto: "true"
        containers:
          app:
            image:
              repository: docker.io/searxng/searxng
              tag: 2024.7.7-ef103ba80
            # SEARXNG_SECRET is supplied by the ExternalSecret-managed Secret.
            envFrom:
              - secretRef:
                  name: searxng-secret
            env:
              TZ: America/Chicago
              SEARXNG_BASE_URL: https://search.jahanson.tech
              SEARXNG_URL: https://search.jahanson.tech
              # Anchored so the probes and the Service reuse the same port.
              SEARXNG_PORT: &port 8080
            probes:
              # Liveness and readiness share one definition via the anchor.
              liveness: &probes
                enabled: true
                custom: true
                spec:
                  httpGet:
                    path: /stats
                    port: *port
                  initialDelaySeconds: 0
                  periodSeconds: 10
                  timeoutSeconds: 1
                  failureThreshold: 3
              readiness: *probes
              startup:
                enabled: false
            securityContext:
              allowPrivilegeEscalation: false
              readOnlyRootFilesystem: true
              capabilities:
                drop:
                  - ALL
                add:
                  - CHOWN
                  - SETGID
                  - SETUID
                  - DAC_OVERRIDE
            resources:
              requests:
                cpu: 10m
              limits:
                memory: 3Gi
    service:
      app:
        controller: searxng
        ports:
          http:
            port: *port
    ingress:
      app:
        enabled: true
        className: internal-nginx
        hosts:
          - host: &host "search.jahanson.tech"
            paths:
              - path: /
                service:
                  identifier: app
                  port: http
        tls:
          - hosts:
              - *host
    persistence:
      config:
        type: configMap
        name: searxng-configmap
        advancedMounts:
          searxng:
            app:
              - path: /etc/searxng/settings.yml
                subPath: settings.yml
                readOnly: true
              - path: /etc/searxng/limiter.toml
                subPath: limiter.toml
                readOnly: true
      tmp:
        type: emptyDir
        # NOTE(review): presumably provides a writable /etc/searxng because
        # the root filesystem is read-only — confirm.
        advancedMounts:
          searxng:
            app:
              - path: /etc/searxng

View file

@ -0,0 +1,14 @@
---
# yaml-language-server: $schema=https://json.schemastore.org/kustomization
# Kustomize entry point for SearXNG: the ExternalSecret, the HelmRelease, and
# a generated ConfigMap holding settings.yml and limiter.toml.
apiVersion: kustomize.config.k8s.io/v1beta1
kind: Kustomization
resources:
  - ./externalsecret.yaml
  - ./helmrelease.yaml
configMapGenerator:
  - name: searxng-configmap
    files:
      - settings.yml=./resources/settings.yml
      - limiter.toml=./resources/limiter.toml
generatorOptions:
  # Keep the ConfigMap name stable so the HelmRelease can reference
  # `searxng-configmap` directly.
  disableNameSuffixHash: true

View file

@ -0,0 +1,6 @@
# This configuration file updates the default configuration file
# See https://github.com/searxng/searxng/blob/master/searx/limiter.toml
# NOTE(review): the accompanying settings.yml sets `server.limiter: false`, so
# these settings presumably have no effect until the limiter is re-enabled —
# confirm.
[botdetection.ip_limit]
# activate link_token method in the ip_limit method
link_token = true

View file

@ -0,0 +1,51 @@
---
# SearXNG settings layered on top of the built-in defaults
# (use_default_settings: true).
use_default_settings: true
server:
  limiter: false
  image_proxy: true
redis:
  url: redis://dragonfly.database.svc.cluster.local:6379?db=10
search:
  safe_search: 0
  autocomplete: brave
  # `json` is enabled alongside `html`; presumably required by API clients
  # such as Open WebUI's web search — confirm.
  formats:
    - html
    - json
general:
  instance_name: HansonSearch
ui:
  static_use_hash: true
  default_theme: simple
  theme_args:
    simple_style: dark
  infinite_scroll: true
  results_on_new_tab: true
enabled_plugins:
  - Basic Calculator
  - Hash plugin
  - Hostnames plugin
  - Open Access DOI rewrite
  - Self Informations
  - Tracker URL remover
  - Unit converter plugin
hostnames:
  # Regular expressions; single-quoted so backslashes stay literal, with the
  # dots in domain names escaped so they match only a literal `.`.
  high_priority:
    # NOTE(review): this pattern targets a URL path; verify the Hostnames
    # plugin matches against more than the host name, otherwise it never hits.
    - '(.*)\/blog\/(.*)'
    - '(.*\.)?wikipedia\.org$'
    - '(.*\.)?github\.com$'
    - '(.*\.)?reddit\.com$'
    - '(.*\.)?linuxserver\.io$'
    - '(.*\.)?docker\.com$'
    - '(.*\.)?archlinux\.org$'
    - '(.*\.)?stackoverflow\.com$'
    - '(.*\.)?askubuntu\.com$'
    - '(.*\.)?superuser\.com$'
  # replace:
  #   (www\.)?reddit\.com$: redlib.rostvik.site

View file

@ -0,0 +1,27 @@
---
# yaml-language-server: $schema=https://ks.hsn.dev/kustomize.toolkit.fluxcd.io/kustomization_v1.json
# Flux Kustomization that applies ./kubernetes/apps/default/searxng/app from
# the homelab GitRepository into the `default` namespace.
apiVersion: kustomize.toolkit.fluxcd.io/v1
kind: Kustomization
metadata:
  name: &app searxng
  namespace: flux-system
spec:
  targetNamespace: default
  commonMetadata:
    labels:
      app.kubernetes.io/name: *app
  dependsOn:
    - name: dragonfly
    - name: external-secrets-stores
  path: ./kubernetes/apps/default/searxng/app
  prune: true
  sourceRef:
    kind: GitRepository
    name: homelab
  wait: false
  interval: 30m
  retryInterval: 1m
  timeout: 5m
  postBuild:
    substitute:
      APP: *app

View file

@ -14,6 +14,9 @@ spec:
kind: HelmRepository kind: HelmRepository
name: nvdp name: nvdp
namespace: flux-system namespace: flux-system
metadata:
annotations:
reloader.stakater.com/auto: "true"
install: install:
remediation: remediation:
retries: 3 retries: 3
@ -22,6 +25,18 @@ spec:
remediation: remediation:
retries: 3 retries: 3
strategy: rollback strategy: rollback
valuesFrom: values:
- kind: ConfigMap podAnnotations:
configmap.reloader.stakater.com/reload: nvidia-helm-values
config:
name: nvidia-helm-values name: nvidia-helm-values
runtimeClassName: "nvidia"
gfd:
enabled: true
nfd:
enabled: false
resources:
requests:
cpu: 100m
limits:
memory: 512Mi

View file

@ -1,10 +1,12 @@
runtimeClassName: "nvidia" ---
gfd: version: v1
enabled: false flags:
nfd: migStrategy: "single"
enabled: false plugin:
resources: deviceListStrategy: "envvar"
requests: deviceIDStrategy: "uuid"
cpu: 100m sharing:
limits: timeSlicing:
memory: 512Mi resources:
- name: nvidia.com/gpu
replicas: 3

View file

@ -5,3 +5,4 @@ metadata:
name: qbittorrent name: qbittorrent
labels: labels:
kustomize.toolkit.fluxcd.io/prune: disabled kustomize.toolkit.fluxcd.io/prune: disabled
volsync.backube/privileged-movers: "true"