3 changes: 3 additions & 0 deletions helm-charts/docsum/Chart.yaml
@@ -21,13 +21,16 @@ dependencies:
- name: llm-uservice
version: 0-latest
repository: "file://../common/llm-uservice"
condition: llm-uservice.enabled
- name: whisper
version: 0-latest
repository: "file://../common/whisper"
condition: whisper.enabled
- name: ui
version: 0-latest
repository: "file://../common/ui"
alias: docsum-ui
condition: docsum-ui.enabled
- name: nginx
version: 0-latest
repository: "file://../common/nginx"
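Note: the new `condition: whisper.enabled` entry means Helm only installs the whisper subchart when that value resolves to true. A minimal override sketch for a text-only deployment (the file name is illustrative, not part of the chart):

```yaml
# no-audio-values.yaml (hypothetical override file)
# Because Chart.yaml declares `condition: whisper.enabled`, setting this to
# false skips the whisper dependency entirely rather than just scaling it down.
whisper:
  enabled: false
```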
6 changes: 5 additions & 1 deletion helm-charts/docsum/README.md
@@ -26,7 +26,11 @@ helm install docsum docsum --set global.HF_TOKEN=${HFTOKEN} --set global.modelUs
# helm install docsum docsum --set global.HF_TOKEN=${HFTOKEN} --values docsum/rocm-values.yaml
# To use AMD ROCm device with TGI
# helm install docsum docsum --set global.HF_TOKEN=${HFTOKEN} --values docsum/rocm-tgi-values.yaml

# To use with external OpenAI-compatible LLM endpoints (OpenAI, vLLM, TGI, etc.)
# This configures the llm-uservice to connect to external LLM providers while maintaining DocSum compatibility
# helm install docsum docsum --set global.HF_TOKEN=${HFTOKEN} --values docsum/variant_external-llm-values.yaml --set llm-uservice.env.OPENAI_API_KEY="your-api-key" --set llm-uservice.env.LLM_MODEL_ID="gpt-4-turbo"
Collaborator:
Shouldn't this also set a suitable (OpenAI) LLM_ENDPOINT?

Contributor Author:
@eero-t Thanks for pointing that out. This made me realize I wasn't passing the env variables correctly and that we needed a new env variable in the configmap for OPENAI_API_KEY. Please review.

# For vLLM/TGI endpoints:
# helm install docsum docsum --set global.HF_TOKEN=${HFTOKEN} --values docsum/variant_external-llm-values.yaml --set llm-uservice.env.LLM_ENDPOINT="http://your-vllm-server/v1" --set llm-uservice.env.LLM_MODEL_ID="your-model"
```

## Verify
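Note: the `--set` chains in the README example above can get long; under the same assumptions, the external-endpoint overrides could equally be collected into a small extra values file (name and values below are placeholders):

```yaml
# my-external-llm.yaml (hypothetical) -- apply with an extra --values flag
# after docsum/variant_external-llm-values.yaml
llm-uservice:
  env:
    LLM_ENDPOINT: "http://your-vllm-server/v1"  # OpenAI-compatible endpoint (OpenAI, vLLM, TGI, ...)
    LLM_MODEL_ID: "your-model"                  # model served at that endpoint
    OPENAI_API_KEY: "your-api-key"              # only needed for hosted providers
```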
2 changes: 2 additions & 0 deletions helm-charts/docsum/templates/deployment.yaml
@@ -38,10 +38,12 @@ spec:
value: {{ include "llm-uservice.fullname" (index .Subcharts "llm-uservice") }}
- name: LLM_SERVICE_PORT
value: {{ index .Values "llm-uservice" "service" "port" | quote }}
{{- if .Values.whisper.enabled }}
- name: ASR_SERVICE_HOST_IP
value: {{ include "whisper.fullname" (index .Subcharts "whisper") }}
- name: ASR_SERVICE_PORT
value: {{ index .Values "whisper" "service" "port" | quote }}
{{- end }}
securityContext:
{{- toYaml .Values.securityContext | nindent 12 }}
image: "{{ .Values.image.repository }}:{{ .Values.image.tag | default .Chart.AppVersion }}"
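Note: with whisper.enabled left at its default of true, the guarded block above renders two extra env entries, roughly as sketched below (the host name and port are placeholders; the real values come from the whisper subchart and the release name):

```yaml
# Rendered sketch, assuming a release named "docsum" (values are illustrative)
- name: ASR_SERVICE_HOST_IP
  value: docsum-whisper
- name: ASR_SERVICE_PORT
  value: "7066"
```

With whisper.enabled=false the block is omitted, so the docsum gateway starts without any ASR wiring.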
15 changes: 15 additions & 0 deletions helm-charts/docsum/values.yaml
@@ -58,6 +58,7 @@ affinity: {}

# To override values in subchart llm-uservice
llm-uservice:
enabled: true
image:
repository: opea/llm-docsum
DOCSUM_BACKEND: "vLLM"
@@ -79,6 +80,8 @@ vllm:
nginx:
enabled: false
docsum-ui:
# if false, set also nginx.enabled=false
enabled: true
image:
repository: opea/docsum-gradio-ui
tag: "latest"
@@ -101,8 +104,20 @@ docsum-ui:
# type: ClusterIP

dashboard:
enabled: true
prefix: "OPEA DocSum"

whisper:
enabled: true

# External LLM configuration
externalLLM:
enabled: false
LLM_SERVER_HOST: "http://your-llm-server"
LLM_SERVER_PORT: "80"
LLM_MODEL: "your-model"
OPENAI_API_KEY: "your-api-key"

global:
http_proxy: ""
https_proxy: ""
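Note: the comment on docsum-ui above implies the nginx front end should be toggled together with the UI. A sketch of an API-only override under that assumption (file name is illustrative):

```yaml
# headless-docsum.yaml (hypothetical override)
docsum-ui:
  enabled: false
nginx:
  enabled: false  # per the values.yaml comment, keep this in sync with docsum-ui
```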
19 changes: 19 additions & 0 deletions helm-charts/docsum/variant_external-llm-values.yaml
@@ -0,0 +1,19 @@
# Copyright (C) 2024 Intel Corporation
Collaborator:
Suggested change:
- # Copyright (C) 2024 Intel Corporation
+ # Copyright (C) 2025 Intel Corporation

# SPDX-License-Identifier: Apache-2.0

# External LLM configuration - configures llm-uservice to use external LLM providers
# This keeps the llm-uservice wrapper (required for /v1/docsum endpoint) but connects it to external LLMs
llm-uservice:
enabled: true # Keep the wrapper service for DocSum compatibility
env:
# Configure llm-uservice to use external OpenAI-compatible endpoints
LLM_ENDPOINT: "https://api.openai.com/v1" # External LLM API endpoint (OpenAI, vLLM, TGI, etc.)
OPENAI_API_KEY: "${OPENAI_API_KEY}" # API key for authentication
LLM_MODEL_ID: "gpt-4-turbo" # Model to use
TEXTGEN_BACKEND: "openai" # Backend type for OpenAI-compatible endpoints
Collaborator @eero-t (Aug 15, 2025):
This is the DocSum service, not TextGen.

Also, it looks like giving anything other than TGI or vLLM to the *_BACKEND variables will fail the Helm install: https://github.com/opea-project/GenAIInfra/blob/main/helm-charts/common/llm-uservice/templates/configmap.yaml

(In the TEXTGEN_BACKEND case there also seems to be a BEDROCK option, but that does not really help here.)

Looking at the backend code of llm-uservice for the DOCSUM_BACKEND="vLLM" option, it appears to be OpenAI API compatible, but unfortunately it uses a hard-coded openai_api_key value (an EMPTY string): https://github.com/opea-project/GenAIComps/blob/main/comps/llms/src/doc-summarization/integrations/vllm.py#L58

Comment:
The value is hard-coded to an empty string, but the access_token is passed as an authentication header, and it is taken from the environment variable: https://github.com/opea-project/GenAIComps/blob/2444e6984e27dd34aed5f0b341690e046356940d/comps/llms/src/doc-summarization/integrations/vllm.py#L52

Contributor Author:
@eero-t Based on Sri's comment, I have fallen back to the docsum backend with vLLM; please review.


# Disable local inference services since we're using external LLMs
vllm:
enabled: false
tgi:
enabled: false
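
Note: following the discussion above (only TGI/vLLM pass the configmap template check, and the author fell back to the vLLM docsum backend), the revised variant file would presumably look roughly like the sketch below; this is an illustration of that direction, not the merged file:

```yaml
# Hypothetical shape of the revised external-LLM variant (may differ from the final PR)
llm-uservice:
  enabled: true                     # keep the wrapper that serves /v1/docsum
  DOCSUM_BACKEND: "vLLM"            # per the review, only TGI/vLLM are accepted here
  env:
    LLM_ENDPOINT: "http://your-vllm-server/v1"  # external OpenAI-compatible endpoint
    LLM_MODEL_ID: "your-model"
    OPENAI_API_KEY: "your-api-key"  # per the review, forwarded as an auth header by the backend

# External inference, so no local serving pods
vllm:
  enabled: false
tgi:
  enabled: false
```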