Skip to content

Commit 336441e

Browse files
committed
refactored limits
1 parent 474f7b4 commit 336441e

File tree

1 file changed

+5
-3
lines changed

1 file changed

+5
-3
lines changed

charts/azimuth-llm/templates/api/deployment.yml

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -62,10 +62,12 @@ spec:
62 62   periodSeconds: 10
63 63   resources:
64 64   limits:
65    - {{- if .Values.api.intelXPUsEnabled }}
66    - gpu.intel.com/i915: {{ .Values.api.gpus | int }}
   65 + {{- if eq (.Values.api.gpus | int) 0 }}
   66 + image: "ghcr.io/stackhpc/vllm-cpu"
   67 + {{- else if .Values.api.intelXPUsEnabled }}
   68 + image: "ghcr.io/stackhpc/vllm-xpu"
67 69   {{- else }}
68    - nvidia.com/gpu: {{ .Values.api.gpus | int }}
   70 + image: "vllm/vllm-openai"
69 71   {{- end }}
70 72   volumes:
71 73   - name: data

0 commit comments

Comments (0)