diff --git a/services/ai-llm/deployment.yaml b/services/ai-llm/deployment.yaml
index d78315b..fb0d0e7 100644
--- a/services/ai-llm/deployment.yaml
+++ b/services/ai-llm/deployment.yaml
@@ -14,6 +14,9 @@ spec:
     metadata:
       labels:
         app: ollama
+      annotations:
+        ai.bstein.dev/model: qwen2.5-coder:7b-instruct-q4_0
+        ai.bstein.dev/gpu: RTX 3080 8GB (titan-24)
     spec:
       nodeSelector:
         kubernetes.io/hostname: titan-24