diff --git a/docker-compose.components.yml b/docker-compose.components.yml
index d2e530a9..0069489a 100644
--- a/docker-compose.components.yml
+++ b/docker-compose.components.yml
@@ -114,7 +114,6 @@ services:
       # Optionally, limit the GPUs exposed to the server.
       # At least one GPU is required to run the YOLO TensorRT engine.
       - NVIDIA_VISIBLE_DEVICES=all
-
     command: [tritonserver,
               --model-repository=/models,
               --strict-model-config=false,
@@ -221,6 +220,25 @@ services:
     image: ${REGISTRY}openmpf_ortools_subject_component:${TAG}
     build: ${OPENMPF_PROJECTS_PATH}/openmpf-components/python/OrToolsSubjectComponent
 
+  qwen-speech-summarization:
+    <<: *component-base
+    image: ${REGISTRY}openmpf_qwen_speech_summarization:${TAG}
+    build: ${OPENMPF_PROJECTS_PATH}/openmpf-components/python/QwenSpeechSummarization
+
+  qwen-speech-summarization-server:
+    image: ${REGISTRY}openmpf_qwen_speech_summarization_server:${TAG}
+    build:
+      context: ${OPENMPF_PROJECTS_PATH}/openmpf-components/python/QwenSpeechSummarization
+      dockerfile: Dockerfile.vllm
+    deploy:
+      mode: global
+      # resources:
+      #   reservations:
+      #     devices:
+      #       - driver: nvidia
+      #         device_ids: ['0']
+      #         capabilities: [gpu]
+
   scene-change-detection:
     <<: *component-base
     image: ${REGISTRY}openmpf_scene_change_detection:${TAG}