Fixing PR conflicts (#2)

couillonnade · web-flow · commit 916355b627cc · 2024-06-27T19:18:19.000+09:00
* Fixing PR conflicts

* fix relative path
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,8 @@
+phi3v/
+quantized_phi3v/
+adapters/
+*.egg-info
+*.json
+.DS_STORE
+.DS_Store
+__pycache__/
diff --git a/examples/main.py b/examples/main.py
@@ -0,0 +1,37 @@
+'''
+This is a simple example of how to use the Phi-3 Vision MLX agent.
+The agent can be used for Visual Question Answering, Generative Feedback Loop, API Tool Use, and more.
+
+Author: Josef Albers
+
+More examples here: https://github.com/JosefAlbers/Phi-3-Vision-MLX
+'''
+
+import sys
+import os
+
+# Add this script's parent folder (the one containing phi_3_vision_mlx.py) to the module search path so the import below resolves
+sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
+
+from phi_3_vision_mlx import Agent
+
+# Visual Question Answering (VQA)
+agent = Agent()
+agent('What is shown in this image?', 'https://collectionapi.metmuseum.org/api/collection/v1/iiif/344291/725918/main-image')
+agent.end()
+
+# Generative Feedback Loop
+# The agent can be used to generate code, execute it, and then modify it based on feedback
+
+agent('Plot a Lissajous Curve.')
+agent('Modify the code to plot 3:4 frequency')
+agent.end()
+
+# API Tool Use
+# You can use the agent to create images or generate speech using API calls
+
+agent('Draw "A perfectly red apple, 32k HDR, studio lighting"')
+agent.end()
+agent('Speak "People say nothing is impossible, but I do nothing every day."')
+agent.end()
+
diff --git a/phi_3_vision_mlx.py b/phi_3_vision_mlx.py
@@ -734,7 +734,10 @@ def _apply_chat_template(prompt, images, verbose, apply_chat_template=True):
         img_prompt = ''
     prompt = [prompt] if isinstance(prompt, str) else prompt
     prompt = [f"<|user|>\n{img_prompt}{i}<|end|>\n<|assistant|>\n" for i in prompt]
-    print(f'### Prompt ###\n{"\n".join(map(str.strip, prompt)).strip()}\n### Images ###\n{"\n".join(map(str, images)) if images else "None"}\n### Output ###') if verbose else None
+    if verbose:
+        prompt_str = "\n".join(map(str.strip, prompt)).strip()
+        images_str = "\n".join(map(str, images)) if images else "None"
+        print(f'### Prompt ###\n{prompt_str}\n### Images ###\n{images_str}\n### Output ###')
     prompt = prompt[0] if len(prompt) == 1 else prompt
     return prompt, images