Skip to content
Closed
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions helm-charts/audioqna/cpu-multilang-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@ tgi:
enabled: false
vllm:
enabled: true
VLLM_CPU_OMP_THREADS_BIND: all

speecht5:
enabled: false
Expand Down
1 change: 1 addition & 0 deletions helm-charts/audioqna/cpu-values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@ tgi:
enabled: false
vllm:
enabled: true
VLLM_CPU_OMP_THREADS_BIND: all

speecht5:
enabled: true
Expand Down
3 changes: 3 additions & 0 deletions helm-charts/common/vllm/templates/configmap.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,9 @@ data:
{{- if .Values.VLLM_CPU_KVCACHE_SPACE }}
VLLM_CPU_KVCACHE_SPACE: {{ .Values.VLLM_CPU_KVCACHE_SPACE | quote}}
{{- end }}
{{- if .Values.VLLM_CPU_OMP_THREADS_BIND }}
VLLM_CPU_OMP_THREADS_BIND: {{ .Values.VLLM_CPU_OMP_THREADS_BIND | quote}}
{{- end }}
{{- if .Values.VLLM_SKIP_WARMUP }}
VLLM_SKIP_WARMUP: {{ .Values.VLLM_SKIP_WARMUP | quote }}
{{- end }}
Expand Down
1 change: 1 addition & 0 deletions helm-charts/common/vllm/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -107,6 +107,7 @@ LLM_MODEL_ID: meta-llama/Meta-Llama-3-8B-Instruct
OMPI_MCA_btl_vader_single_copy_mechanism: ""
PT_HPU_ENABLE_LAZY_COLLECTIVES: ""
VLLM_CPU_KVCACHE_SPACE: ""
VLLM_CPU_OMP_THREADS_BIND: ""

global:
http_proxy: ""
Expand Down