Skip to content

Commit

Permalink
Use official vLLM image
Browse files (browse the repository at this point in the history)
  • Loading branch information
sd109 committed Dec 12, 2023
1 parent 6876068 commit 50870e0
Show file tree
Hide file tree
Showing 2 changed files with 7 additions and 4 deletions.
3 changes: 2 additions & 1 deletion templates/api/deployment.yml
Original file line number | Diff line number | Diff line change
Expand Up @@ -26,12 +26,13 @@ spec:
- name: data
mountPath: /root/.cache/huggingface
command:
- - python3.11
+ - python3
args:
- -m
- vllm.entrypoints.api_server
- --model
- {{ .Values.huggingface.model }}
{{- .Values.api.extraArgs | toYaml | nindent 10 }}
{{- if .Values.huggingface.secretName }}
envFrom:
- secretRef:
Expand Down
8 changes: 5 additions & 3 deletions values.yaml
Original file line number | Diff line number | Diff line change
Expand Up @@ -30,7 +30,7 @@ api:
# Container image config
image:
repository: ghcr.io/stackhpc/azimuth-llm-api-base
- version: fae060a
+ version: "6876068"
# Service config
service:
name: text-generation-inference
Expand Down Expand Up @@ -61,13 +61,15 @@ api:
rollingUpdate:
maxSurge: 0%
maxUnavailable: 100%

# Extra args to supply to the vLLM backend
extraArgs: []

# Configuration for the frontend web interface
ui:
# Container image config
image:
repository: ghcr.io/stackhpc/azimuth-llm-ui-base
- version: 7b1d77f
+ version: "6876068"
# Service config
service:
name: web-app
Expand Down

0 comments on commit 50870e0

Please sign in to comment.