# Ollama Deployment with GPU # Требования: NVIDIA GPU Operator установлен в кластере --- apiVersion: apps/v1 kind: Deployment metadata: name: ollama namespace: gooseek labels: app: ollama app.kubernetes.io/name: ollama app.kubernetes.io/part-of: gooseek spec: replicas: 1 selector: matchLabels: app: ollama template: metadata: labels: app: ollama spec: runtimeClassName: nvidia containers: # Ollama server (только GPU) - name: ollama image: ollama/ollama:latest ports: - containerPort: 11434 name: http env: - name: OLLAMA_HOST value: "0.0.0.0:11434" - name: OLLAMA_KEEP_ALIVE value: "24h" - name: OLLAMA_MODELS value: "/root/.ollama/models" # Параллельная обработка для SaaS - name: OLLAMA_NUM_PARALLEL value: "4" - name: OLLAMA_MAX_LOADED_MODELS value: "2" - name: OLLAMA_FLASH_ATTENTION value: "true" # GPU - name: NVIDIA_VISIBLE_DEVICES value: "all" - name: NVIDIA_DRIVER_CAPABILITIES value: "compute,utility" volumeMounts: - name: ollama-data mountPath: /root/.ollama resources: requests: cpu: 1000m memory: 8Gi nvidia.com/gpu: 1 limits: cpu: 4000m memory: 16Gi nvidia.com/gpu: 1 livenessProbe: httpGet: path: / port: 11434 initialDelaySeconds: 30 periodSeconds: 30 timeoutSeconds: 5 readinessProbe: httpGet: path: / port: 11434 initialDelaySeconds: 10 periodSeconds: 10 timeoutSeconds: 5 volumes: - name: ollama-data persistentVolumeClaim: claimName: ollama-pvc --- apiVersion: v1 kind: PersistentVolumeClaim metadata: name: ollama-pvc namespace: gooseek spec: accessModes: - ReadWriteOnce resources: requests: storage: 20Gi --- apiVersion: v1 kind: Service metadata: name: ollama namespace: gooseek spec: type: ClusterIP selector: app: ollama ports: - port: 11434 targetPort: 11434 name: http --- # NetworkPolicy: llm-svc и model-loader могут обращаться к ollama apiVersion: networking.k8s.io/v1 kind: NetworkPolicy metadata: name: ollama-access namespace: gooseek spec: podSelector: matchLabels: app: ollama policyTypes: - Ingress ingress: - from: - podSelector: matchLabels: app: llm-svc - podSelector: matchLabels: app: ollama-model-loader ports: - protocol: TCP port: 11434