From c6bae35bc6f7749aacbe6215626ad6308fcfd0a4 Mon Sep 17 00:00:00 2001
From: Brad Stein
Date: Sun, 21 Dec 2025 00:47:57 -0300
Subject: [PATCH] chore(ai-llm): annotate pod with model and gpu

---
Notes (review commentary; not part of the commit message):

  * Adds an `annotations` map next to `labels` in the pod template
    metadata, with two keys: `ai.bstein.dev/model` and `ai.bstein.dev/gpu`.
  * The gpu annotation value names `titan-24`, the same host the existing
    nodeSelector (`kubernetes.io/hostname: titan-24`) pins the pod to.
    The two are independent strings; if the nodeSelector changes, the
    annotation has to be updated by hand.
  * Both values are plain YAML scalars that resolve to strings: the model
    tag contains `:` but never `: `, and the gpu value starts with a
    letter, so no quoting is required.
  * The hunk edits the pod template, so applying the resulting manifest is
    expected to roll the Deployment's pods.
  * NOTE(review): the leading whitespace of the hunk lines below was
    reconstructed assuming 2-space nesting under `spec.template`. Confirm
    against services/ai-llm/deployment.yaml before applying; context lines
    must match the target file's whitespace exactly.

 services/ai-llm/deployment.yaml | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/services/ai-llm/deployment.yaml b/services/ai-llm/deployment.yaml
index d78315b..fb0d0e7 100644
--- a/services/ai-llm/deployment.yaml
+++ b/services/ai-llm/deployment.yaml
@@ -14,6 +14,9 @@ spec:
     metadata:
       labels:
         app: ollama
+      annotations:
+        ai.bstein.dev/model: qwen2.5-coder:7b-instruct-q4_0
+        ai.bstein.dev/gpu: RTX 3080 8GB (titan-24)
     spec:
       nodeSelector:
         kubernetes.io/hostname: titan-24