- Add namespace, PVC, deployment, service, and kustomization for Ollama
- ClusterIP only (internal), no ingress
- 10Gi PVC mounted at /root/.ollama
- Resources: requests of 700Mi memory / 500m CPU, limits of 1500Mi memory / 1000m CPU
- Add ArgoCD Application CR for ollama
- Update backend configmap with OLLAMA_BASE_URL and OLLAMA_CHAT_MODEL
40 lines
No EOL
870 B
YAML
40 lines
No EOL
870 B
YAML
---
# Deployment that runs a single Ollama server pod in the nxtgauge-ai namespace.
# The container's /root/.ollama directory is backed by the "ollama-models"
# PersistentVolumeClaim so its contents survive pod restarts.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: nxtgauge-ai
  labels:
    app: ollama
spec:
  replicas: 1
  # Stop the old pod before starting its replacement. With the default
  # RollingUpdate strategy the new pod starts while the old one still holds
  # the volume, which can stall a rollout when the claim only allows a single
  # attachment.
  # NOTE(review): assumes the ollama-models PVC is ReadWriteOnce - confirm
  # against the PVC manifest.
  strategy:
    type: Recreate
  selector:
    matchLabels:
      app: ollama
  template:
    metadata:
      labels:
        app: ollama
    spec:
      containers:
        - name: ollama
          # NOTE(review): ":latest" is a mutable tag, so a pod restart can pull
          # a different build. Pin to a tested version once one is chosen.
          image: ollama/ollama:latest
          ports:
            - containerPort: 11434
              name: http
          env:
            # Bind address and port for the Ollama server; 0.0.0.0 makes it
            # reachable from outside the container on the port declared above.
            - name: OLLAMA_HOST
              value: "0.0.0.0:11434"
          # Only mark the pod Ready once the HTTP server answers, so traffic
          # is not routed to it before it is listening.
          readinessProbe:
            httpGet:
              path: /
              port: http
            initialDelaySeconds: 5
            periodSeconds: 10
          volumeMounts:
            - name: ollama-models
              mountPath: /root/.ollama
          resources:
            requests:
              cpu: 500m
              memory: 700Mi
            limits:
              cpu: 1000m
              memory: 1500Mi
      volumes:
        - name: ollama-models
          persistentVolumeClaim:
            claimName: ollama-models