
Commit 2b040c0 (merge of 2 parents: 8cc38df + a6e9984)

321 files changed, +4694 −2065 lines changed


.github/code_spell_ignore.txt

Lines changed: 2 additions & 1 deletion

@@ -1,3 +1,4 @@
 ModelIn
 modelin
-pressEnter
+pressEnter
+PromptIn

.github/env/_build_image.sh

Lines changed: 2 additions & 1 deletion

@@ -1,5 +1,6 @@
+#!/bin/bash
 # Copyright (C) 2025 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0

-export VLLM_VER=v0.8.3
+export VLLM_VER=v0.9.0.1
 export VLLM_FORK_VER=v0.6.6.post1+Gaudi-1.20.0
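This bumps the pinned upstream vLLM release from v0.8.3 to v0.9.0.1 while leaving the Gaudi fork pin unchanged. Below is a minimal sketch of how these pins might be consumed when preparing an image build locally; sourcing the env file and the clone step are assumptions for illustration, not part of this commit:

#!/bin/bash
# Sketch only: pick up the pinned versions, then check out vLLM at that tag (assumed workflow).
source .github/env/_build_image.sh
echo "Building against vLLM ${VLLM_VER} (Gaudi fork ${VLLM_FORK_VER})"
git clone --depth 1 --branch "${VLLM_VER}" https://github.com/vllm-project/vllm.git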

.github/workflows/_gmc-e2e.yml

Lines changed: 1 addition & 1 deletion

@@ -56,7 +56,7 @@ jobs:
       - name: Run tests
         id: run-test
         env:
-          HUGGINGFACEHUB_API_TOKEN: ${{ secrets.HUGGINGFACEHUB_API_TOKEN }}
+          HF_TOKEN: ${{ secrets.HF_TOKEN }}
           GOOGLE_CSE_ID: ${{ secrets.GOOGLE_CSE_ID }}
           GOOGLE_API_KEY: ${{ secrets.GOOGLE_API_KEY }}
         run: |

.github/workflows/_run-docker-compose.yml

Lines changed: 2 additions & 2 deletions

@@ -170,8 +170,8 @@ jobs:
       - name: Run test
         shell: bash
         env:
-          HUGGINGFACEHUB_API_TOKEN: ${{ secrets.HUGGINGFACEHUB_API_TOKEN }}
-          HF_TOKEN: ${{ secrets.HUGGINGFACEHUB_API_TOKEN }}
+          HUGGINGFACEHUB_API_TOKEN: ${{ secrets.HF_TOKEN }}
+          HF_TOKEN: ${{ secrets.HF_TOKEN }}
           GOOGLE_CSE_ID: ${{ secrets.GOOGLE_CSE_ID }}
           GOOGLE_API_KEY: ${{ secrets.GOOGLE_API_KEY }}
           PINECONE_KEY: ${{ secrets.PINECONE_KEY }}
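Here both the new HF_TOKEN variable and the legacy HUGGINGFACEHUB_API_TOKEN variable are populated from the single HF_TOKEN secret, so tests that still read the old name keep working during the rename. A local equivalent of that mapping, as a sketch (the token value is your own):

export HF_TOKEN=<your-HF-token>
export HUGGINGFACEHUB_API_TOKEN=${HF_TOKEN}   # kept only for components that still read the legacy name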

.set_env.sh

Lines changed: 1 addition & 0 deletions

@@ -1,3 +1,4 @@
+#!/bin/bash
 # Copyright (C) 2024 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 #

AgentQnA/README.md

Lines changed: 1 addition & 1 deletion

@@ -123,7 +123,7 @@ Set up a [HuggingFace](https://huggingface.co/) account and generate a [user acc
 Then set an environment variable with the token and another for a directory to download the models:

 ```bash
-export HUGGINGFACEHUB_API_TOKEN=<your-HF-token>
+export HF_TOKEN=<your-HF-token>
 export HF_CACHE_DIR=<directory-where-llms-are-downloaded> # to avoid redownloading models
 ```
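After exporting the token under its new name, you can optionally confirm it is being picked up before any models are pulled; the check below uses the huggingface_hub CLI and is an illustrative step, not part of the README itself:

export HF_TOKEN=<your-HF-token>
export HF_CACHE_DIR=<directory-where-llms-are-downloaded>
huggingface-cli whoami   # should print your HF account name if HF_TOKEN is valid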

AgentQnA/docker_compose/amd/gpu/rocm/README.md

Lines changed: 1 addition & 1 deletion

@@ -170,7 +170,7 @@ Use AMD GPU driver utilities to determine the correct `cardN` and `renderN` IDs
 ### Replace the string 'server_address' with your local server IP address
 export host_ip='server_address'
 ### Replace the string 'your_huggingfacehub_token' with your HuggingFacehub repository access token.
-export HUGGINGFACEHUB_API_TOKEN='your_huggingfacehub_token'
+export HF_TOKEN='your_huggingfacehub_token'
 ### Replace the string 'your_langchain_api_key' with your LANGCHAIN API KEY.
 export LANGCHAIN_API_KEY='your_langchain_api_key'
 export LANGCHAIN_TRACING_V2=""

AgentQnA/docker_compose/amd/gpu/rocm/compose.yaml

Lines changed: 5 additions & 5 deletions

@@ -13,8 +13,8 @@ services:
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
       TGI_LLM_ENDPOINT: "http://${ip_address}:${TGI_SERVICE_PORT}"
-      HUGGING_FACE_HUB_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGING_FACE_HUB_TOKEN: ${HF_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
     shm_size: 32g
     devices:
       - /dev/kfd:/dev/kfd
@@ -42,7 +42,7 @@ services:
       with_memory: false
       recursion_limit: ${recursion_limit_worker}
       llm_engine: tgi
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}
@@ -76,7 +76,7 @@ services:
       use_hints: false
       recursion_limit: ${recursion_limit_worker}
       llm_engine: vllm
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}
@@ -104,7 +104,7 @@ services:
       with_memory: true
       recursion_limit: ${recursion_limit_supervisor}
       llm_engine: tgi
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}

AgentQnA/docker_compose/amd/gpu/rocm/compose_vllm.yaml

Lines changed: 5 additions & 5 deletions

@@ -10,8 +10,8 @@ services:
       no_proxy: ${no_proxy}
       http_proxy: ${http_proxy}
       https_proxy: ${https_proxy}
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
-      HF_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
+      HF_TOKEN: ${HF_TOKEN}
       HF_HUB_DISABLE_PROGRESS_BARS: 1
       HF_HUB_ENABLE_HF_TRANSFER: 0
       WILM_USE_TRITON_FLASH_ATTENTION: 0
@@ -46,7 +46,7 @@ services:
       with_memory: false
       recursion_limit: ${recursion_limit_worker}
       llm_engine: vllm
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}
@@ -80,7 +80,7 @@ services:
       use_hints: false
       recursion_limit: ${recursion_limit_worker}
       llm_engine: vllm
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}
@@ -108,7 +108,7 @@ services:
       with_memory: true
       recursion_limit: ${recursion_limit_supervisor}
       llm_engine: vllm
-      HUGGINGFACEHUB_API_TOKEN: ${HUGGINGFACEHUB_API_TOKEN}
+      HUGGINGFACEHUB_API_TOKEN: ${HF_TOKEN}
       llm_endpoint_url: ${LLM_ENDPOINT_URL}
       model: ${LLM_MODEL_ID}
       temperature: ${temperature}
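Both compose files now interpolate ${HF_TOKEN} from the host environment, so the token must be exported in the shell that starts the stack. A hedged usage sketch (the compose file names come from this diff; the rest is generic Docker Compose usage, not a documented command from this commit):

export HF_TOKEN=<your-HF-token>
docker compose -f compose_vllm.yaml up -d   # or compose.yaml for the TGI variant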

AgentQnA/docker_compose/amd/gpu/rocm/launch_agent_service_tgi_rocm.sh

Lines changed: 4 additions & 3 deletions

@@ -1,9 +1,10 @@
+#!/bin/bash
 # Copyright (C) 2024 Advanced Micro Devices, Inc.
 # SPDX-License-Identifier: Apache-2.0

 # Before start script:
 # export host_ip="your_host_ip_or_host_name"
-# export HUGGINGFACEHUB_API_TOKEN="your_huggingface_api_token"
+# export HF_TOKEN="your_huggingface_api_token"
 # export LANGCHAIN_API_KEY="your_langchain_api_key"
 # export LANGCHAIN_TRACING_V2=""

@@ -19,7 +20,7 @@ export CRAG_SERVER_PORT="18114"

 export WORKPATH=$(dirname "$PWD")
 export WORKDIR=${WORKPATH}/../../../
-export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN}
+export HF_TOKEN=${HF_TOKEN}
 export LLM_MODEL_ID="Intel/neural-chat-7b-v3-3"
 export HF_CACHE_DIR="./data"
 export MODEL_CACHE="./data"

@@ -39,7 +40,7 @@ export CRAG_SERVER=http://${ip_address}:${CRAG_SERVER_PORT}
 export WORKER_AGENT_URL="http://${ip_address}:${WORKER_RAG_AGENT_PORT}/v1/chat/completions"
 export SQL_AGENT_URL="http://${ip_address}:${WORKER_SQL_AGENT_PORT}/v1/chat/completions"
 export HF_CACHE_DIR=${HF_CACHE_DIR}
-export HUGGINGFACEHUB_API_TOKEN=${HUGGINGFACEHUB_API_TOKEN}
+export HF_TOKEN=${HF_TOKEN}
 export no_proxy=${no_proxy}
 export http_proxy=${http_proxy}
 export https_proxy=${https_proxy}
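The launch script now expects HF_TOKEN to be exported beforehand and re-exports it for the stack it brings up. A minimal invocation sketch based on the script's own header comments; running it from its containing directory is an assumption:

export host_ip="your_host_ip_or_host_name"
export HF_TOKEN="your_huggingface_api_token"
bash launch_agent_service_tgi_rocm.sh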
