
Commit b206d6c

Add sample inference configs for HuggingFaceTB/SmolVLM-Instruct (#1703)
1 parent edc471f

File tree

2 files changed (+54 -0 lines changed):

  configs/recipes/vision/smolvlm/inference/infer.yaml
  configs/recipes/vision/smolvlm/inference/vllm_infer.yaml

configs/recipes/vision/smolvlm/inference/infer.yaml
Lines changed: 27 additions & 0 deletions
@@ -0,0 +1,27 @@
# SmolVLM Instruct inference config.
#
# Requirements:
#   - Run `pip install oumi[gpu]`
#
# Usage:
#   oumi infer -i -c configs/recipes/vision/smolvlm/inference/infer.yaml \
#     --image "tests/testdata/images/the_great_wave_off_kanagawa.jpg"
#
# See Also:
#   - Documentation: https://oumi.ai/docs/en/latest/user_guides/infer/infer.html
#   - Config class: oumi.core.configs.InferenceConfig
#   - Config source: https://github.com/oumi-ai/oumi/blob/main/src/oumi/core/configs/inference_config.py
#   - Other inference configs: configs/**/inference/

model:
  model_name: "HuggingFaceTB/SmolVLM-Instruct"
  torch_dtype_str: "bfloat16"
  model_max_length: 3072
  chat_template: "llava"
  trust_remote_code: True

generation:
  max_new_tokens: 32
  batch_size: 1

engine: NATIVE
configs/recipes/vision/smolvlm/inference/vllm_infer.yaml
Lines changed: 27 additions & 0 deletions
@@ -0,0 +1,27 @@
# vLLM inference config for SmolVLM Instruct.
#
# Requirements:
#   - Run `pip install oumi[gpu]`
#
# Usage:
#   oumi infer -i -c configs/recipes/vision/smolvlm/inference/vllm_infer.yaml \
#     --image "tests/testdata/images/the_great_wave_off_kanagawa.jpg"
#
# See Also:
#   - Documentation: https://oumi.ai/docs/en/latest/user_guides/infer/infer.html
#   - Config class: oumi.core.configs.InferenceConfig
#   - Config source: https://github.com/oumi-ai/oumi/blob/main/src/oumi/core/configs/inference_config.py
#   - Other inference configs: configs/**/inference/

model:
  model_name: "HuggingFaceTB/SmolVLM-Instruct"
  torch_dtype_str: "bfloat16"
  model_max_length: 3072
  chat_template: "llava"
  trust_remote_code: True

generation:
  max_new_tokens: 32
  batch_size: 1

engine: VLLM
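
The two configs differ only in the engine: VLLM serves the same model through vLLM's runtime, which is typically faster for batched generation. As a rough sketch of direct vLLM usage with the same settings (not oumi's wrapper; assumes your vLLM build supports this model's architecture, and the question text is again an illustrative assumption):

# Rough sketch: direct vLLM multimodal inference,
# mirroring vllm_infer.yaml (bfloat16, max length 3072, 32 new tokens).
from PIL import Image
from transformers import AutoProcessor
from vllm import LLM, SamplingParams

model_name = "HuggingFaceTB/SmolVLM-Instruct"
processor = AutoProcessor.from_pretrained(model_name)

# Mirror the config: bfloat16, model_max_length: 3072, trust_remote_code.
llm = LLM(
    model=model_name,
    dtype="bfloat16",
    max_model_len=3072,
    trust_remote_code=True,
)

image = Image.open("tests/testdata/images/the_great_wave_off_kanagawa.jpg")
messages = [
    {
        "role": "user",
        "content": [
            {"type": "image"},
            # Illustrative prompt; any question about the image works.
            {"type": "text", "text": "Describe this image."},
        ],
    }
]
prompt = processor.apply_chat_template(messages, add_generation_prompt=True)

# Mirror the config: max_new_tokens: 32.
outputs = llm.generate(
    {"prompt": prompt, "multi_modal_data": {"image": image}},
    SamplingParams(max_tokens=32),
)
print(outputs[0].outputs[0].text)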
