diff --git a/AI-Travel-Agent/requirements.txt b/AI-Travel-Agent/requirements.txt index 885361c..a90e34b 100644 --- a/AI-Travel-Agent/requirements.txt +++ b/AI-Travel-Agent/requirements.txt @@ -2,10 +2,10 @@ amadeus==12.0.0 ipykernel==7.0.1 jupyter==1.1.1 langchain==1.0.2 -langchain-community==0.3.27 +langchain-community==0.4.1 streamlit==1.51.0 huggingface-hub==1.1.4 pydantic==2.12.3 wikipedia==1.4.0 google-search-results==2.4.2 -hf-xet==1.2.0 +hf-xet==1.2.0 \ No newline at end of file diff --git a/LLM/rag/requirements.txt b/LLM/rag/requirements.txt index 1fceec8..e3ba24b 100644 --- a/LLM/rag/requirements.txt +++ b/LLM/rag/requirements.txt @@ -1,12 +1,12 @@ -langchain==0.3.24 +langchain==0.3.27 langchain-community==0.3.27 -langchain-core==0.3.56 +langchain-core==0.3.72 langchain-huggingface==0.1.2 -huggingface-hub==0.29.1 +huggingface-hub>=0.30.0 sentence-transformers==3.4.1 chromadb==0.6.3 transformers==4.53.1 pypdf==6.1.3 torch==2.7.1 langchain-chroma==0.2.2 -beautifulsoup4==4.13.3 +beautifulsoup4==4.13.3 \ No newline at end of file diff --git a/LLM/src/README.md b/LLM/src/README.md new file mode 100644 index 0000000..c9c1422 --- /dev/null +++ b/LLM/src/README.md @@ -0,0 +1,150 @@ +# RAG Chat with Ollama + +A Streamlit-based Retrieval-Augmented Generation (RAG) chat application powered by Ollama on Intel® Core™ Ultra Processors. + +## Overview + +This application demonstrates a RAG (Retrieval-Augmented Generation) system that allows you to chat with documents using Ollama's language models. Upload your documents, and the system will create embeddings and enable semantic search to provide context-aware responses. + +## Prerequisites + +- Windows 11 or Ubuntu 20.04+ +- Intel® Core™ Ultra Processors or Intel Arc™ Graphics +- 16GB+ RAM recommended + +## Setup + +### 1. Install Ollama + +Download and install Ollama: +```powershell +winget install Ollama.Ollama +``` + +Or download from [https://ollama.com/download](https://ollama.com/download) + +### 2. 
Building Ollama with GPU Support (Vulkan) + +For advanced users who want to build Ollama from source with Vulkan GPU acceleration on Windows: + +**a. Install Vulkan SDK** +- Download from: [https://vulkan.lunarg.com/sdk/home](https://vulkan.lunarg.com/sdk/home) + +**b. Install TDM-GCC** +- Download from: [https://github.com/jmeubank/tdm-gcc/releases/tag/v10.3.0-tdm64-2](https://github.com/jmeubank/tdm-gcc/releases/tag/v10.3.0-tdm64-2) + +**c. Install Go SDK** +- Download Go v1.24.9: [https://go.dev/dl/go1.24.9.windows-amd64.msi](https://go.dev/dl/go1.24.9.windows-amd64.msi) + +**d. Build Ollama with Vulkan** +```powershell +# Set environment variables +set CGO_ENABLED=1 +set CGO_CFLAGS=-IC:\VulkanSDK\1.4.321.1\Include + +# Build with CMake +cmake -B build +cmake --build build --config Release -j14 + +# Build Go binary +go build + +# Run Ollama server (Terminal 1) +go run . serve + +# Test with a model (Terminal 2) +ollama run gemma3:270m +``` + +**Note:** This is for advanced users. The pre-built Ollama installation works fine for most users. + +### 3. Pull Language Models + +Pull the models you want to use: +```bash +ollama pull llama3.2 +ollama pull qwen2.5 +ollama pull mistral +``` + +### 4. Install Python Dependencies + +Using pip: +```bash +pip install streamlit ollama chromadb sentence-transformers pypdf +``` + +Using uv (recommended): +```bash +uv pip install streamlit ollama chromadb sentence-transformers pypdf +``` + +## Running the Application + +### 1. Start Ollama Server + +If not already running: +```bash +ollama serve +``` + +### 2. Run the Streamlit App + +```bash +# Using Python directly +streamlit run st_rag_chat.py + +# Or using uv +uv run streamlit run st_rag_chat.py +``` + +### 3. Access the App + +Open your browser and navigate to: +``` +http://localhost:8501 +``` + +## Usage + +1. **Choose a Document Source**: Enter a URL, or select a `.txt`, `.pdf`, or `.md` file placed in the `data` folder (`LLM/data`) +2. **Select Model**: Choose your preferred Ollama model from the dropdown +3. 
**Load Document**: Click "Load Document" to create embeddings +4. **Chat**: Ask questions about your documents in the chat interface +5. **View Sources**: See which document sections were used to answer your questions + +## Features + +- 📄 **Multi-format Support**: Load web pages by URL, or PDF, text, and Markdown files from the `data` folder +- 🤖 **Model Selection**: Choose from available Ollama models +- 🔍 **Semantic Search**: Find relevant context using vector embeddings +- 💬 **Context-Aware Chat**: Get answers based on your documents +- 📚 **Source Attribution**: See which parts of documents were used +- 💾 **Persistent Storage**: ChromaDB vector database for efficient retrieval + +## Troubleshooting + +**Ollama Connection Error:** +- Ensure Ollama is running: `ollama serve` +- Check if models are installed: `ollama list` + +**Memory Issues:** +- Use smaller models like `llama3.2:1b` or `qwen2.5:3b` +- Reduce the number of documents processed at once + +**Slow Performance:** +- Ensure GPU drivers are up to date +- Use GPU-accelerated Ollama build (Vulkan) +- Try smaller, faster models + +## Technical Stack + +- **Ollama**: Local LLM runtime +- **Streamlit**: Web interface +- **ChromaDB**: Vector database +- **Sentence Transformers**: Text embeddings +- **Intel Hardware**: Optimized for Intel Core™ Ultra Processors + +## License + +This project is licensed under the MIT License. diff --git a/LLM/src/st_ollama.py b/LLM/src/st_ollama.py index f704eb1..90335a5 100644 --- a/LLM/src/st_ollama.py +++ b/LLM/src/st_ollama.py @@ -13,7 +13,8 @@ def load_models(): list: A list of model names if successful, otherwise an empty list. 
""" try: - model_list = [model["name"] for model in ollama.list()["models"]] + response = ollama.list() + model_list = [model.model for model in response.models] return model_list except Exception as e: st.error(f"Error loading models: {e}") diff --git a/LLM/src/st_rag_chat.py b/LLM/src/st_rag_chat.py new file mode 100644 index 0000000..5b2b69f --- /dev/null +++ b/LLM/src/st_rag_chat.py @@ -0,0 +1,431 @@ +from langchain.chains import RetrievalQA +from langchain.text_splitter import RecursiveCharacterTextSplitter +from langchain_core.prompts import PromptTemplate +from langchain_community.embeddings.fastembed import FastEmbedEmbeddings +from langchain_community import document_loaders, embeddings, vectorstores, llms +from langchain_community.document_loaders import DirectoryLoader, TextLoader +from langchain_community.document_loaders.pdf import PyPDFLoader +import streamlit as st +import time +import os +import warnings +import ollama +import hashlib + +warnings.filterwarnings("ignore") + +OLLAMA_BASE_URL = "http://localhost:11434" + +st.header("LLM RAG Chat Interface 🐻‍❄️💬") + +# Initialize session state for chat history +if "messages" not in st.session_state: + st.session_state.messages = [] +if "vector_store" not in st.session_state: + st.session_state.vector_store = None +if "current_document" not in st.session_state: + st.session_state.current_document = None + +response = ollama.list() +models = [model.model for model in response.models] +model = st.selectbox("Choose a model from the list", models) + +# Select source type +source_type = st.selectbox( + "Select document source:", + ("URL", "Local File from Data Folder"), + key="source_type" +) + +if source_type == "URL": + # Input text to load the document from URL + source_path = st.text_input("Enter the URL to load for RAG:", key="url_path") +else: + # Show available files in data folder + current_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) # Go up to LLM folder + data_dir = 
os.path.join(current_dir, "data") + if os.path.exists(data_dir): + files = [f for f in os.listdir(data_dir) if f.endswith(('.txt', '.pdf', '.md'))] + if files: + st.write("Available files in data folder:") + source_path = st.selectbox("Select a file:", files, key="file_selection") + st.info(f"Selected file: {source_path}") + else: + st.warning("No supported files (.txt, .pdf, .md) found in data folder") + source_path = None + else: + st.error("Data folder not found. Please create a 'data' folder in the parent directory and add your files.") + source_path = None + +# Select embedding type +embedding_type = st.selectbox( + "Please select an embedding type", + ("ollama", + "huggingface", + "nomic", + "fastembed"), + index=1) + + +def load_document(source_path, source_type="URL"): + """ + Load the document from the specified URL or local file. + + Args: + source_path (str): The URL or filename of the document to load. + source_type (str): Either "URL" or "Local File from Data Folder" + + Returns: + Document: The loaded document. + """ + if source_type == "URL": + print("Loading document from URL...") + st.markdown(''' :green[Loading document from URL...] ''') + loader = document_loaders.WebBaseLoader(source_path) + return loader.load() + else: + # Load from local file in data folder + current_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) # Go up to LLM folder + data_dir = os.path.join(current_dir, "data") + full_path = os.path.join(data_dir, source_path) + + if not os.path.exists(full_path): + raise FileNotFoundError(f"File not found: {full_path}") + + print(f"Loading document from: {full_path}") + st.markdown(f''' :green[Loading document from: {full_path}] ''') + + if source_path.endswith('.pdf'): + loader = PyPDFLoader(full_path) + else: + loader = TextLoader(full_path, encoding='utf-8') + + return loader.load() + + +def split_document(text, chunk_size=3000, overlap=200): + """ + Split the document into multiple chunks. 
+ + Args: + text (str): The text of the document to split. + chunk_size (int): The size of each chunk. + overlap (int): The overlap between chunks. + + Returns: + list: A list of document chunks. + """ + print("Splitting document into chunks...") + st.markdown(''' :green[Splitting document into chunks...] ''') + text_splitter_instance = RecursiveCharacterTextSplitter( + chunk_size=chunk_size, chunk_overlap=overlap) + return text_splitter_instance.split_documents(text) + + +def initialize_embedding_fn( + embedding_type="huggingface", + model_name="sentence-transformers/all-MiniLM-l6-v2"): + """ + Initialize the embedding function based on the specified type. + + Args: + embedding_type (str): The type of embedding to use. + model_name (str): The name of the model to use for embeddings. + + Returns: + Embeddings: The initialized embedding function. + """ + print(f"Initializing {embedding_type} model with {model_name}...") + st.write(f"Initializing {embedding_type} model with {model_name}...") + if embedding_type == "ollama": + model_name = chat_model + return embeddings.OllamaEmbeddings( + model=model_name, base_url=OLLAMA_BASE_URL) + elif embedding_type == "huggingface": + model_name = "sentence-transformers/paraphrase-MiniLM-L3-v2" + return embeddings.HuggingFaceEmbeddings(model_name=model_name) + elif embedding_type == "nomic": + return embeddings.NomicEmbeddings(model_name=model_name) + elif embedding_type == "fastembed": + return FastEmbedEmbeddings(threads=16) + else: + raise ValueError(f"Unsupported embedding type: {embedding_type}") + + +def get_or_create_embeddings(document_url, source_type, embedding_fn): + """ + Create embeddings for the document chunks and store them in a vector database. + Uses persistent storage with improved caching that considers embedding type. + + Args: + document_url (str): The URL of the document. + source_type (str): The type of source (URL or local file). + embedding_fn (Embeddings): The embedding function to use. 
+ + Returns: + VectorStore: The created or loaded vector store. + """ + # Create a more specific hash for caching that includes embedding type + embedding_type_name = embedding_fn.__class__.__name__ + cache_key = f"{document_url}_{source_type}_{embedding_type_name}" + source_hash = hashlib.md5(cache_key.encode()).hexdigest() + persist_directory = f"./chroma_db/{source_hash}" + + print(f"Cache key: {cache_key}") + print(f"Cache directory: {persist_directory}") + + # Check if embeddings already exist and are for the same document + if os.path.exists(persist_directory): + # Check if there's a metadata file to verify this is the right document + metadata_file = os.path.join(persist_directory, "document_info.txt") + if os.path.exists(metadata_file): + with open(metadata_file, 'r', encoding='utf-8') as f: + cached_info = f.read().strip() + if cached_info == cache_key: + print(f"Loading existing embeddings from: {persist_directory}") + st.markdown(f''' :orange[Loading cached embeddings for: {source_type}: {document_url}] ''') + try: + vector_store = vectorstores.Chroma( + persist_directory=persist_directory, + embedding_function=embedding_fn + ) + return vector_store + except Exception as e: + print(f"Error loading cached embeddings: {e}") + st.warning("Error loading cached embeddings, creating new ones...") + else: + print(f"Cache mismatch. 
Expected: {cache_key}, Found: {cached_info}") + st.warning("Cache mismatch detected, creating new embeddings...") + else: + print("No metadata file found, creating new embeddings...") + st.warning("Cache metadata missing, creating new embeddings...") + + # Create new embeddings + start_time = time.time() + print(f"Creating new embeddings for: {document_url}") + st.markdown(f''' :green[Creating new embeddings for: {source_type}: {document_url}] ''') + + # Clean up the directory if it exists but has issues + if os.path.exists(persist_directory): + import shutil + shutil.rmtree(persist_directory) + + document = load_document(document_url, source_type) + documents = split_document(document) + + vector_store = vectorstores.Chroma.from_documents( + documents=documents, + embedding=embedding_fn, + persist_directory=persist_directory + ) + + # Save metadata to verify cache validity + os.makedirs(persist_directory, exist_ok=True) + metadata_file = os.path.join(persist_directory, "document_info.txt") + with open(metadata_file, 'w', encoding='utf-8') as f: + f.write(cache_key) + + print(f"Embedding time: {time.time() - start_time:.2f} seconds") + st.write(f"Embedding time: {time.time() - start_time:.2f} seconds") + return vector_store + + +def get_chat_context(): + """ + Build context from previous messages for continuity + """ + if not st.session_state.messages: + return "" + + # Get last few messages for context (limit to avoid token overflow) + recent_messages = st.session_state.messages[-6:] # Last 3 Q&A pairs + context_parts = [] + + for msg in recent_messages: + if msg["role"] == "user": + context_parts.append(f"Previous Question: {msg['content']}") + else: + context_parts.append(f"Previous Answer: {msg['content']}") + + return "\n".join(context_parts) + + +def handle_chat_query(vector_store, chat_model, question): + """ + Handle chat query with context awareness + """ + # Get conversation context + chat_context = get_chat_context() + + # Create enhanced question with 
chat context if available + if chat_context: + enhanced_question = f""" +Previous conversation context: +{chat_context} + +Current question: {question} +""" + else: + enhanced_question = question + + # Simple prompt template that only uses context and question + prompt_template = """ + Use the following pieces of context to answer the question at the end. + If you do not know the answer, answer 'I don't know', limit your response to the answer and nothing more. + + {context} + + Question: {question} + """ + + prompt = PromptTemplate( + template=prompt_template, + input_variables=["context", "question"] + ) + + chain_type_kwargs = {"prompt": prompt} + retriever = vector_store.as_retriever(search_kwargs={"k": 4}) + + qachain = RetrievalQA.from_chain_type( + llm=chat_model, + retriever=retriever, + chain_type="stuff", + chain_type_kwargs=chain_type_kwargs + ) + + start_time = time.time() + answer = qachain.invoke({"query": enhanced_question}) + print(f"Response time: {time.time() - start_time:.2f} seconds") + + return answer['result'] + + +# Load document section +st.write("### 📄 Document Loading") +load_button = st.button("Load Document", type="primary") + +if load_button: + if not source_path or not source_path.strip(): + st.error("Please select/enter a valid source.") + else: + with st.spinner("Loading document and creating embeddings..."): + try: + embedding_fn = initialize_embedding_fn(embedding_type) + vector_store = get_or_create_embeddings(source_path, source_type, embedding_fn) + + # Proper warmup: initialize the model and retriever chain + st.markdown(''' :green[Initializing RAG system...] 
''') + chat_model_instance = llms.Ollama(base_url=OLLAMA_BASE_URL, model=model) + + # Warmup the retriever + retriever = vector_store.as_retriever(search_kwargs={"k": 4}) + warmup_docs = retriever.get_relevant_documents("document content summary") + + # Warmup the QA chain with actual query + prompt_template = """ + Use the following pieces of context to answer the question at the end. + If you do not know the answer, answer 'I don't know', limit your response to the answer and nothing more. + + {context} + + Question: {question} + """ + prompt = PromptTemplate( + template=prompt_template, + input_variables=["context", "question"] + ) + chain_type_kwargs = {"prompt": prompt} + + warmup_chain = RetrievalQA.from_chain_type( + llm=chat_model_instance, + retriever=retriever, + chain_type="stuff", + chain_type_kwargs=chain_type_kwargs + ) + + # Execute warmup query + warmup_chain.invoke({"query": "What is this document about?"}) + + st.session_state.vector_store = vector_store + st.session_state.current_document = f"{source_type}: {source_path}" + + # Clear previous chat and add initial summary request + st.session_state.messages = [] + st.session_state.messages.append({ + "role": "user", + "content": "Summarize this document" + }) + + # Generate the summary automatically + st.markdown(''' :green[Generating document summary...] ''') + summary = handle_chat_query( + st.session_state.vector_store, + chat_model_instance, + "Summarize this document" + ) + st.session_state.messages.append({ + "role": "assistant", + "content": summary + }) + + st.success(f"✅ Document loaded successfully!") + st.info(f"Loaded: {st.session_state.current_document}") + st.rerun() + except Exception as e: + st.error(f"Error loading document: {e}") + +# Display current document status +if st.session_state.current_document: + st.write(f"📄 **Current Document**: {st.session_state.current_document}") +else: + st.warning("⚠️ No document loaded. 
Please load a document first.") + +# Chat Interface +st.write("### 💬 Chat Interface") + +# Display chat messages +for message in st.session_state.messages: + with st.chat_message(message["role"]): + st.markdown(message["content"]) + +# Chat input +if question := st.chat_input("Ask a question about the document..."): + if not st.session_state.vector_store: + st.error("Please load a document first!") + else: + # Add user message to chat history + st.session_state.messages.append({"role": "user", "content": question}) + + # Display user message + with st.chat_message("user"): + st.markdown(question) + + # Generate response + with st.chat_message("assistant"): + with st.spinner("Thinking..."): + try: + chat_model_instance = llms.Ollama( + base_url=OLLAMA_BASE_URL, model=model) + response = handle_chat_query( + st.session_state.vector_store, + chat_model_instance, + question + ) + st.markdown(response) + + # Add assistant response to chat history + st.session_state.messages.append({"role": "assistant", "content": response}) + + except Exception as e: + error_msg = f"Error generating response: {str(e)}" + st.error(error_msg) + st.session_state.messages.append({"role": "assistant", "content": error_msg}) + +# Clear chat button +if st.button("🗑️ Clear Chat History"): + st.session_state.messages = [] + st.rerun() + +# Display chat statistics +if st.session_state.messages: + st.write(f"💬 **Chat History**: {len(st.session_state.messages)} messages") \ No newline at end of file diff --git a/LLM/src/st_rag_chromadb.py b/LLM/src/st_rag_chromadb.py deleted file mode 100644 index 0b41f56..0000000 --- a/LLM/src/st_rag_chromadb.py +++ /dev/null @@ -1,219 +0,0 @@ -from langchain import chains, text_splitter, PromptTemplate -from langchain_community.embeddings.fastembed import FastEmbedEmbeddings -from langchain_community import document_loaders, embeddings, vectorstores, llms -import streamlit as st -import time -import os -import warnings -import ollama - 
-warnings.filterwarnings("ignore") - -OLLAMA_BASE_URL = "http://localhost:11434" -VECTOR_DB_DIR = "vector_dbs" - -st.header("LLM Rag 🐻‍❄️") - -models = [model["name"] for model in ollama.list()["models"]] -model = st.selectbox("Choose a model from the list", models) - -# Input text to load the document -url_path = st.text_input("Enter the URL to load for RAG:", key="url_path") - -# Select embedding type -embedding_type = st.selectbox( - "Please select an embedding type", - ("ollama", - "huggingface", - "nomic", - "fastembed"), - index=1) - -# Input for RAG -question = st.text_input( - "Enter the question for RAG:", - value="What is this about", - key="question") - - -def load_document(url): - """ - Load the document from the specified URL. - - Args: - url (str): The URL of the document to load. - - Returns: - Document: The loaded document. - """ - print("Loading document from URL...") - st.markdown(''' :green[Loading document from URL...] ''') - loader = document_loaders.WebBaseLoader(url) - return loader.load() - - -def split_document(text, chunk_size=3000, overlap=200): - """ - Split the document into multiple chunks. - - Args: - text (str): The text of the document to split. - chunk_size (int): The size of each chunk. - overlap (int): The overlap between chunks. - - Returns: - list: A list of document chunks. - """ - print("Splitting document into chunks...") - st.markdown(''' :green[Splitting document into chunks...] ''') - text_splitter_instance = text_splitter.RecursiveCharacterTextSplitter( - chunk_size=chunk_size, chunk_overlap=overlap) - return text_splitter_instance.split_documents(text) - - -def initialize_embedding_fn( - embedding_type="huggingface", - model_name="sentence-transformers/all-MiniLM-l6-v2"): - """ - Initialize the embedding function based on the specified type. - - Args: - embedding_type (str): The type of embedding to use. - model_name (str): The name of the model to use for embeddings. 
- - Returns: - Embeddings: The initialized embedding function. - """ - print(f"Initializing {embedding_type} model with {model_name}...") - st.write(f"Initializing {embedding_type} model with {model_name}...") - if embedding_type == "ollama": - model_name = chat_model - return embeddings.OllamaEmbeddings( - model=model_name, base_url=OLLAMA_BASE_URL) - elif embedding_type == "huggingface": - model_name = "sentence-transformers/paraphrase-MiniLM-L3-v2" - return embeddings.HuggingFaceEmbeddings(model_name=model_name) - elif embedding_type == "nomic": - return embeddings.NomicEmbeddings(model_name=model_name) - elif embedding_type == "fastembed": - return FastEmbedEmbeddings(threads=16) - else: - raise ValueError(f"Unsupported embedding type: {embedding_type}") - - -def get_or_create_embeddings( - document_url, - embedding_fn, - persist_dir=VECTOR_DB_DIR): - """ - Create embeddings for the document chunks and store them in a vector database. - - Args: - document_url (str): The URL of the document. - embedding_fn (Embeddings): The embedding function to use. - persist_dir (str): The directory to persist the vector database. - - Returns: - VectorStore: The created vector store. - """ - vector_store_path = os.path.join(os.getcwd(), persist_dir) - start_time = time.time() - print("No existing vector store found. Creating new one...") - st.markdown( - ''' :green[No existing vector store found. Creating new one......] ''') - document = load_document(document_url) - documents = split_document(document) - vector_store = vectorstores.Chroma.from_documents( - documents=documents, - embedding=embedding_fn, - persist_directory=persist_dir - ) - vector_store.persist() - print(f"Embedding time: {time.time() - start_time:.2f} seconds") - st.write(f"Embedding time: {time.time() - start_time:.2f} seconds") - return vector_store - - -def handle_user_interaction(vector_store, chat_model): - """ - Handle user interaction by generating a response based on the user's question. 
- - Args: - vector_store (VectorStore): The vector store containing document embeddings. - chat_model (LLM): The language model to generate responses. - - Returns: - str: The generated response. - """ - prompt_template = """ - Use the following pieces of context to answer the question at the end. - If you do not know the answer, answer 'I don't know', limit your response to the answer and nothing more. - - {context} - - Question: {question} - """ - prompt = PromptTemplate( - template=prompt_template, - input_variables=[ - "context", - "question"]) - chain_type_kwargs = {"prompt": prompt} - st.markdown( - ''' :green[Using retrievers to retrieve the data from the database...] ''') - retriever = vector_store.as_retriever(search_kwargs={"k": 4}) - st.markdown(''' :green[Answering the query...] ''') - qachain = chains.RetrievalQA.from_chain_type( - llm=chat_model, - retriever=retriever, - chain_type="stuff", - chain_type_kwargs=chain_type_kwargs) - qachain.invoke({"query": "what is this about?"}) - print(f"Model warmup complete...") - st.markdown(''' :green[Model warmup complete...] ''') - - start_time = time.time() - answer = qachain.invoke({"query": question}) - print(f"Answer: {answer['result']}") - print(f"Response time: {time.time() - start_time:.2f} seconds") - st.write(f"Response time: {time.time() - start_time:.2f} seconds") - - return answer['result'] - - -def getfinalresponse(document_url, embedding_type, chat_model): - """ - Main function to load the document, initialize the embeddings, create the vector database, and invoke the model. - - Args: - document_url (str): The URL of the document. - embedding_type (str): The type of embedding to use. - chat_model (str): The name of the chat model to use. - - Returns: - str: The final response generated by the model. 
- """ - try: - document_url = url_path - chat_model = model - - embedding_fn = initialize_embedding_fn(embedding_type) - vector_store = get_or_create_embeddings(document_url, embedding_fn) - chat_model_instance = llms.Ollama( - base_url=OLLAMA_BASE_URL, model=chat_model) - return handle_user_interaction(vector_store, chat_model_instance) - except Exception as e: - st.error(f"An error occurred: {e}") - return None - - -submit = st.button("Generate") - -if submit: - if not url_path.strip(): - st.error("Please enter a valid URL.") - elif not question.strip(): - st.error("Please enter a valid question.") - else: - with st.spinner("Loading document....🐎"): - st.write(getfinalresponse(url_path, embedding_type, model)) diff --git a/Video-Description-Generation-Query-Retrieval/Readme.md b/Video-Description-Generation-Query-Retrieval/Readme.md index 13f976e..16fd9d7 100644 --- a/Video-Description-Generation-Query-Retrieval/Readme.md +++ b/Video-Description-Generation-Query-Retrieval/Readme.md @@ -1,10 +1,17 @@ -# Video Description Generation and Query Retrieval +# Video Description Generation and Query Retrieval with Ollama ## Introduction -This sample demonstrates how to generate video descriptions using the [**Qwen 2.5 Vision-Language model**](https://github.com/QwenLM/Qwen2.5-VL) and store their embeddings in [**ChromaDB**](https://www.trychroma.com/) for efficient semantic search on **Intel® Core™ Ultra Processors**. The Qwen 2.5 Vision-Language model is loaded using the [**PyTorch XPU backend**](https://docs.pytorch.org/docs/stable/notes/get_start_xpu.html) to leverage Intel hardware acceleration.\ -For each video, a description is generated and stored as an embedding in ChromaDB. When a user submits a query, cosine similarity search is performed in ChromaDB to retrieve the most relevant video description. 
The matching video is then displayed inline.\ +This sample demonstrates how to generate video descriptions using [**Ollama**](https://ollama.ai) vision models and store their embeddings in [**ChromaDB**](https://www.trychroma.com/) for efficient semantic search on **Intel® Core™ Ultra Processors** and **Intel® Arc™ Graphics**. + +Ollama provides an optimized runtime for vision-language models (Qwen 2.5 VL, Llama 3.2 Vision, LLaVA) with simplified deployment on Intel GPUs. For each video, a description is generated and stored as an embedding in ChromaDB. When a user submits a query, cosine similarity search is performed in ChromaDB to retrieve the most relevant video description. + This sample uses the videos from the [**stepfun-ai/Step-Video-T2V-Eval**](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) Hugging Face dataset. For more information on the dataset and citation requirements, please refer to the [**Step-Video-T2V Technical Report paper**](https://arxiv.org/abs/2502.10248). +### Available Interfaces: + +- `Video_RAG_Ollama.ipynb` - Jupyter notebook implementation +- `st_video_rag_demo.py` - Streamlit web interface + --- ## Table of Contents @@ -25,12 +32,59 @@ This sample uses the videos from the [**stepfun-ai/Step-Video-T2V-Eval**](https: ## Architecture -- During the initial data load, videos from the [Step-Video-T2V-Eval](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) Hugging Face dataset is fed into the [Qwen 2.5 Vision-Language model](https://github.com/QwenLM/Qwen2.5-VL). -- Here, the [Qwen2.5-VL-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct) model variant is used to process these videos and generate descriptions. The Qwen 2.5 Vision-Language model is loaded using the [PyTorch XPU backend](https://docs.pytorch.org/docs/stable/notes/get_start_xpu.html) to leverage Intel hardware acceleration. 
-- Next, the generated video descriptions are converted into embeddings using [Sentence Transformers](https://sbert.net/), with the [all-MiniLM-L6-v2 model](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2). -- These embeddings, along with the descriptions and video metadata, are stored in a persistent local [ChromaDB](https://www.trychroma.com/) collection. This is a one-time operation; since ChromaDB is local and persistent, it does not need to be repeated unless new videos are added. -- When a user submits a query, the text is similarly encoded into an embedding, which is then used to perform a semantic search (via cosine similarity) over the ChromaDB collection. -- The final result will be the most relevant video description and its associated video file name, and the video is displayed directly in the notebook. +### System Workflow + +``` +┌─────────────────────────────────────────────────────────────────────┐ +│ VIDEO PROCESSING PIPELINE │ +└─────────────────────────────────────────────────────────────────────┘ + +Video Files ──► Frame Extraction ──► Ollama Vision Model ──► Text Descriptions + │ + │ (Accelerated by Intel GPUs) + ▼ + Sentence Transformer ──► ChromaDB Storage + │ +┌─────────────────────────────────────────────────────────────┘ +│ SEARCH PIPELINE +└─────────────────────────────────────────────────────────────────────┐ + │ +User Query ──► Query Embedding ──► Cosine Similarity ◄────────────────┘ + │ + ▼ + Ranked Results ──► Display Videos + +┌─────────────────────────────────────────────────────────────────────┐ +│ Hardware: Intel Arc™ Graphics | Core™ Ultra | Iris® Xe Graphics │ +└─────────────────────────────────────────────────────────────────────┘ +``` + +### Workflow Details + +**Video Processing Pipeline:** + +1. **Video Input**: Videos from [Step-Video-T2V-Eval](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) dataset +2. **Frame Extraction**: Representative frames extracted using OpenCV +3. 
**Vision Model**: Ollama runtime with Qwen 2.5 VL, Llama 3.2 Vision, or LLaVA on Intel GPU +4. **Description Generation**: Detailed text descriptions of video content +5. **Embedding Creation**: Text → vector embeddings via [Sentence Transformers](https://sbert.net/) ([all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2)) +6. **Storage**: Embeddings + metadata stored in [ChromaDB](https://www.trychroma.com/) vector database + +**Search Pipeline:** + +1. **User Query**: Natural language text input (e.g., "person playing basketball") +2. **Query Embedding**: Convert query to vector using same embedding model +3. **Similarity Search**: Cosine similarity search over ChromaDB collection +4. **Ranked Results**: Return top matching videos with similarity scores +5. **Display**: Show videos with descriptions and match quality + +**Intel Hardware Optimization:** + +- **Intel Arc™ Graphics**: GPU acceleration for vision model inference +- **Intel Core™ Ultra Processors**: Optimized CPU performance +- **Intel Iris® Xe Graphics**: Integrated graphics acceleration +- **Local Processing**: No cloud dependency, all computation on-device +- **Ollama Runtime**: Optimized for Intel hardware ![How it works](./assets/Video_description_generation_and_query_retrieval_workflow.png) @@ -39,14 +93,15 @@ This sample uses the videos from the [**stepfun-ai/Step-Video-T2V-Eval**](https: ## Project Structure Video-Description-Generation-Query-Retrieval/ # Project Sample folder - ├── assets/ # Assets folder which contains the images and diagrams - │ ├── Generating_video_descriptions_using_Pytorch_XPU.png # Output screenshot image 1 - │ ├── Video_description_generation_and_query_retrieval_workflow.jpg # Workflow image - │ └── Video_display.png # Output screenshot image 2 - ├── Readme.md # Readme file which contains all the details and instructions about the project sample - ├── Video_Description_Generation_Query_Retrieval.ipynb # Notebook file to excute the project 
sample - ├── pyproject.toml # Requirements for the project sample - └── uv.lock # File which captures the packages installed for the project sample + ├── assets/ # Assets folder with images and diagrams + │ ├── Generating_video_descriptions_using_Pytorch_XPU.png # PyTorch XPU output screenshot + │ ├── Video_description_generation_and_query_retrieval_workflow.jpg # Workflow diagram + │ └── Video_display.png # Video display screenshot + ├── Readme.md # Main README + ├── Video_RAG_Ollama.ipynb # Ollama-based notebook + ├── st_video_rag_demo.py # Streamlit web interface + ├── pyproject.toml # UV/pip requirements + └── uv.lock # UV lock file --- @@ -81,33 +136,79 @@ Please find the some of the keywords below used in the prompts across 11 differe ### For Windows: To install any software using commands, Open the Command Prompt as an administrator by right-clicking the terminal icon and selecting `Run as administrator`. + 1. **GPU Drivers installation**\ Download and install the Intel® Graphics Driver for Intel® Arc™ B-Series, A-Series, Intel® Iris® Xe Graphics, and Intel® Core™ Ultra Processors with Intel® Arc™ Graphics from [here](https://www.intel.com/content/www/us/en/download/785597/intel-arc-iris-xe-graphics-windows.html)\ **IMPORTANT:** Reboot the system after the installation. -2. **Git for Windows**\ +2. **Ollama Installation**\ + Download and install Ollama from [https://ollama.com/download](https://ollama.com/download) or use the command: + ```powershell + winget install Ollama.Ollama + ``` + + **Building Ollama with GPU Support (Vulkan)**\ + For advanced users who want to build Ollama from source with Vulkan GPU acceleration: + + a. **Install Vulkan SDK** + - Download and install from [https://vulkan.lunarg.com/sdk/home](https://vulkan.lunarg.com/sdk/home) + + b. **Install TDM-GCC** + - Download and install from [https://github.com/jmeubank/tdm-gcc/releases/tag/v10.3.0-tdm64-2](https://github.com/jmeubank/tdm-gcc/releases/tag/v10.3.0-tdm64-2) + + c. 
**Install Go SDK** + - Download and install Go v1.24.9 from [https://go.dev/dl/go1.24.9.windows-amd64.msi](https://go.dev/dl/go1.24.9.windows-amd64.msi) + + d. **Build Ollama with Vulkan** + ```powershell + # Set environment variables + set CGO_ENABLED=1 + set CGO_CFLAGS=-IC:\VulkanSDK\1.4.321.1\Include + + # Build with CMake + cmake -B build + cmake --build build --config Release -j14 + + # Build Go binary + go build + + # Run Ollama server (Terminal 1) + go run . serve + + # Test with a model (Terminal 2) + ollama run gemma3:270m + ``` + +3. **Git for Windows**\ Download and install Git from [here](https://git-scm.com/downloads/win) -3. **uv for Windows**\ +4. **uv for Windows**\ Steps to install `uv` in the Command Prompt are as follows. Please refer to the [documentation](https://docs.astral.sh/uv/getting-started/installation/) for more information. - ``` + ```powershell powershell -ExecutionPolicy ByPass -c "irm https://astral.sh/uv/install.ps1 | iex" ``` **NOTE:** Close and reopen the Command Prompt to recognize uv. ### For Linux: To install any software using commands, Open a new terminal window by right-clicking the terminal and selecting `New Window`. + 1. **GPU Drivers installation**\ Download and install the GPU drivers from [here](https://dgpu-docs.intel.com/driver/client/overview.html) -2. **Dependencies on Linux**\ +2. **Ollama Installation**\ + Install Ollama using the official script: + ```bash + curl -fsSL https://ollama.com/install.sh | sh + ``` + +3. **Dependencies on Linux**\ Install Curl, Wget, Git using the following commands: - For Debian/Ubuntu-based systems: - ``` + ```bash sudo apt update && sudo apt -y install curl wget git ``` - For RHEL/CentOS-based systems: - ``` + ```bash sudo dnf update && sudo dnf -y install curl wget git ``` @@ -125,50 +226,89 @@ To install any software using commands, Open a new terminal window by right-clic --- -## Running the Sample && execution output - -1. 
In the Command Prompt/terminal, navigate to `Video-Description-Generation-Query-Retrieval` folder after cloning the sample: - ``` +## Running the Sample + +### Quick Start with Streamlit (Recommended) + +1. **Navigate to project folder:** + ```bash cd ``` - -2. Log in to Hugging Face, generate a token, and download the required models and datasets:\ - `huggingface-cli` lets you interact directly with the Hugging Face Hub from a terminal. Log in to [Huggingface](https://huggingface.co/) with your credentials. You need a [User Access Token](https://huggingface.co/docs/hub/security-tokens) from your [Settings page](https://huggingface.co/settings/tokens). The User Access Token is used to authenticate your identity to the Hub.\ - Once you have your token, run the following command in your terminal. + +2. **Pull an Ollama vision model:** + ```bash + ollama pull qwen2.5-vl + # OR + ollama pull qwen3-vl:latest + # OR + ollama pull llama3.2-vision + # OR + ollama pull llava ``` + +3. **Download the video dataset:** + + Log in to [Huggingface](https://huggingface.co/) and get a [User Access Token](https://huggingface.co/docs/hub/security-tokens) from your [Settings page](https://huggingface.co/settings/tokens). + + ```bash uv run huggingface-cli login - ``` - This command will prompt you for a token. Copy-paste yours and press Enter. - ``` - uv run huggingface-cli download Qwen/Qwen2.5-VL-3B-Instruct - uv run huggingface-cli download sentence-transformers/all-MiniLM-L6-v2 uv run huggingface-cli download stepfun-ai/Step-Video-T2V-Eval --repo-type dataset --local-dir ./Step-Video-T2V-Eval ``` -3. Launch Jupyter Lab and Run the notebook:\ - Open the [Video Description Generation Query Retrieval](./Video_Description_Generation_Query_Retrieval.ipynb) notebook in the Jupyter Lab. - - In the Jupyter Lab go to the kernel menu in the top-right corner of the notebook interface and choose default kernel i.e. 
`Python 3 (ipykernel)` from the available kernels list and run the code cells one by one in the notebook. - ``` - uv run jupyter lab - ``` - - If you are running the sample in the [Intel Tiber AI Cloud(ITAC)](https://ai.cloud.intel.com/), follow these steps in a new terminal session. Create and select the `uv_env` Jupyter kernel to get access to required python packages in the notebook. +4. **Launch the Streamlit application:** + ```bash + uv run streamlit run st_video_rag_demo.py ``` + + The app will open in your browser at `http://localhost:8501` + +5. **Use the application:** + - Go to "Process Videos" tab + - Configure settings (model, dataset folder, max videos) + - Click "Start Processing" + - Once complete, go to "Search Videos" tab + - Enter natural language queries to find videos + +### Alternative: Jupyter Notebook + +1. **Install dependencies:** + ```bash uv sync - uv run python -m ipykernel install --user --name=uv_env --display-name="uv_env" ``` -4. GPU utilization can be seen in the Task Manager while generating video descriptions for videos which are processing on Intel XPUs. - ![Generating_video_descriptions_using_Pytorch_XPU](./assets/Generating_video_descriptions_using_Pytorch_XPU.png) +2. **Launch Jupyter Lab:** + ```bash + uv run jupyter lab + ``` + + Open `Video_RAG_Ollama.ipynb` and run cells sequentially. -5. Relevant video will be displayed based on user query. - ![Video_display](./assets/Video_display.png) +3. **Expected Output:** + + - GPU utilization can be monitored in Task Manager (Windows) or `intel_gpu_top` (Linux) + - Processing 128 videos typically takes 10-60 minutes depending on hardware + - Search queries return results in < 100ms + - Videos displayed with similarity scores and descriptions --- ## Troubleshooting -- **Dependency Issues:** Run `uv clean` and then `uv sync`. -- **File Access Issues:** Restart the kernel and run the cells again. 
+**Ollama Issues:** +- **Ollama not accessible:** Check if Ollama is running with `ollama list`. Start with `ollama serve` if needed. +- **No vision model:** Pull a vision model: `ollama pull qwen2.5-vl` or `ollama pull llama3.2-vision` +- **Model too slow:** Try a smaller model like `llava` for faster inference + +**Application Issues:** +- **Dependency Issues:** Run `uv clean` and then `uv sync` +- **No videos found:** Ensure video folder path is correct and contains .mp4/.avi/.mov files +- **Database errors:** Delete `Video_descriptions_database_ollama` folder and reprocess +- **Poor search results:** Check that descriptions are detailed (view in "View All Descriptions" section) + +**Performance:** +- **Slow processing:** Reduce number of videos or use a faster model +- **Out of memory:** Process fewer videos at once or use a smaller model +- **GPU not utilized:** Ensure Intel GPU drivers are installed and Ollama is using GPU --- diff --git a/Video-Description-Generation-Query-Retrieval/Video_Description_Generation_Query_Retrieval.ipynb b/Video-Description-Generation-Query-Retrieval/Video_Description_Generation_Query_Retrieval.ipynb deleted file mode 100644 index 1fa010d..0000000 --- a/Video-Description-Generation-Query-Retrieval/Video_Description_Generation_Query_Retrieval.ipynb +++ /dev/null @@ -1,4823 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "b584ead1-9a08-44eb-8c03-4ab98eb0f34a", - "metadata": {}, - "source": [ - "# Video Description Generation and Query Retrieval" - ] - }, - { - "cell_type": "markdown", - "id": "a50c359d-093d-49f2-8a53-43ae428355d1", - "metadata": {}, - "source": [ - "## Overview" - ] - }, - { - "cell_type": "markdown", - "id": "c84bdadd-ac84-4232-baf5-3394e51b6d3b", - "metadata": {}, - "source": [ - "This notebook demonstrates how to generate video descriptions using the [**Qwen 2.5 Vision-Language model**](https://github.com/QwenLM/Qwen2.5-VL) and store their embeddings in [**ChromaDB**](https://www.trychroma.com/) 
for efficient semantic search on **Intel® Core™ Ultra Processors**. The Qwen 2.5 Vision-Language model is loaded using the [**PyTorch XPU backend**](https://docs.pytorch.org/docs/stable/notes/get_start_xpu.html) to leverage Intel hardware acceleration.\\\n", - "For each video, a description is generated and stored as an embedding in ChromaDB. When a user submits a query, cosine similarity search is performed in ChromaDB to retrieve the most relevant video description. The matching video is then displayed inline.\\\n", - "This sample uses the videos from the [**stepfun-ai/Step-Video-T2V-Eval**](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) Hugging Face dataset. For more information on the dataset and citation requirements, please refer to the [**Step-Video-T2V Technical Report paper**](https://arxiv.org/abs/2502.10248)." - ] - }, - { - "cell_type": "markdown", - "id": "4066302a-a785-4a4d-882d-26cba0f73f6c", - "metadata": {}, - "source": [ - "## Workflow" - ] - }, - { - "cell_type": "markdown", - "id": "087121d4-116e-4954-a84d-a8790774ec3c", - "metadata": {}, - "source": [ - "- During the initial data load, videos from the [*Step-Video-T2V-Eval*](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) Hugging Face dataset is fed into the [*Qwen 2.5 Vision-Language model*](https://github.com/QwenLM/Qwen2.5-VL).\n", - "- Here, the [*Qwen2.5-VL-3B-Instruct*](https://huggingface.co/Qwen/Qwen2.5-VL-3B-Instruct) model variant is used to process these videos and generate descriptions. 
The Qwen 2.5 Vision-Language model is loaded using the [*PyTorch XPU backend*](https://docs.pytorch.org/docs/stable/notes/get_start_xpu.html) to leverage Intel hardware acceleration.\n", - "- Next, the generated video descriptions are converted into embeddings using [*Sentence Transformers*](https://sbert.net/), with the [*all-MiniLM-L6-v2 model*](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2).\n", - "- These embeddings, along with the descriptions and video metadata, are stored in a persistent local [*ChromaDB*](https://www.trychroma.com/) collection. This is a one-time operation; since ChromaDB is local and persistent, it does not need to be repeated unless new videos are added.\n", - "- When a user submits a query, the text is similarly encoded into an embedding, which is then used to perform a semantic search (via cosine similarity) over the ChromaDB collection.\n", - "- The final result will be the most relevant video description and its associated video file name, and the video is displayed directly in the notebook." 
- ] - }, - { - "attachments": { - "0ed8e566-5603-4a27-a8ea-906c82934c53.png": { - "image/png": "" - } - }, - "cell_type": "markdown", - "id": "59f92287-32bd-4d39-85ef-7cab033a4259", - "metadata": {}, - "source": [ - "![Video_description_generation_and_query_retrieval_workflow.png](attachment:0ed8e566-5603-4a27-a8ea-906c82934c53.png)" - ] - }, - { - "cell_type": "markdown", - "id": "214bbd89-9b6d-48e8-904d-d08a7450fae0", - "metadata": {}, - "source": [ - "## Import necessary packages\n", - "Import all the necessary packages and libraries" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "id": "d24b9f9f-c73b-4f91-91f9-cae38eb75e34", - "metadata": {}, - "outputs": [], - "source": [ - "import os\n", - "import torch\n", - "import random\n", - "import shutil\n", - "import zipfile\n", - "import logging\n", - "import chromadb\n", - "import warnings\n", - "from tqdm import tqdm\n", - "from IPython.display import Video, display\n", - "from huggingface_hub import notebook_login\n", - "from qwen_vl_utils import process_vision_info\n", - "from sentence_transformers import SentenceTransformer\n", - "from transformers import Qwen2_5_VLForConditionalGeneration, AutoTokenizer, AutoProcessor\n", - "\n", - "logging.basicConfig(level=logging.INFO)\n", - "warnings.filterwarnings(\"ignore\")" - ] - }, - { - "cell_type": "markdown", - "id": "6fd9cf5b-3465-43d0-87bd-b1df7831d5c5", - "metadata": {}, - "source": [ - "## Login to Huggingface to download the models" - ] - }, - { - "cell_type": "markdown", - "id": "f306fbcb-82d7-482a-8b53-b1486f81d639", - "metadata": {}, - "source": [ - "- Log in to [Huggingface](https://huggingface.co/) using your credentials.\n", - "- You’ll need a [User Access Token](https://huggingface.co/docs/hub/security-tokens), which you can generate from your [Settings page](https://huggingface.co/settings/tokens). 
This token is used to authenticate your identity with the Hugging Face Hub.\n", - "- Once you've generated the token, copy it and keep it secure. Then, run the cell below and paste your access token when prompted." - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "36f2f1da-9918-412e-b6f1-41eaf41946ed", - "metadata": {}, - "outputs": [ - { - "data": { - "application/vnd.jupyter.widget-view+json": { - "model_id": "e1cf3cc1e5304bc893397a834433b6d6", - "version_major": 2, - "version_minor": 0 - }, - "text/plain": [ - "VBox(children=(HTML(value='
\n", - " Generating video descriptions and updating the database. This may take some time.\n", - "" - ] - }, - { - "cell_type": "code", - "execution_count": 12, - "id": "829fedae-16d5-47f8-8d2a-447e78d3e3bf", - "metadata": { - "scrolled": true - }, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - " 0%| | 0/128 [00:00\n", - " Your browser does not support the video element.\n", - " " - ], - "text/plain": [ - "" - ] - }, - "metadata": {}, - "output_type": "display_data" - } - ], - "source": [ - "display_video(results)" - ] - }, - { - "cell_type": "markdown", - "id": "c55db9d3-b2e7-4826-8c1b-a1acb288ec9d", - "metadata": { - "scrolled": true - }, - "source": [ - "## Remove the database\n", - "Remove the local database if it is not needed." - ] - }, - { - "cell_type": "code", - "execution_count": 15, - "id": "c9a08316-779e-4c35-bb83-242f6a9e0a37", - "metadata": {}, - "outputs": [], - "source": [ - "def delete_database():\n", - " \"\"\"\n", - " Delete the database directory.\n", - "\n", - " Raises:\n", - " Exception: Raises an exception if there is any error while deleting the database.\n", - " \"\"\"\n", - " database_folder = \"Video_descriptions_database\"\n", - " if os.path.exists(database_folder):\n", - " logging.info(\"You are about to delete the database. 
Once deleted, it will no longer be available, and you will need to regenerate and store the video descriptions again.\")\n", - " database_deletion = 'no'\n", - " if database_deletion == 'yes':\n", - " try:\n", - " shutil.rmtree(database_folder)\n", - " logging.info(\"Database deleted!\")\n", - " except Exception as e:\n", - " logging.exception(f\"Error while deleting the database: {str(e)}\")\n", - " else:\n", - " logging.info(\"Database not deleted\")\n", - " else:\n", - " logging.info(\"Database is not available\")" - ] - }, - { - "cell_type": "code", - "execution_count": 16, - "id": "47d4486c-9165-4ebe-85be-7ed036634624", - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "INFO:root:You are about to delete the database. Once deleted, it will no longer be available, and you will need to regenerate and store the video descriptions again.\n", - "INFO:root:Database not deleted\n" - ] - } - ], - "source": [ - "delete_database()" - ] - }, - { - "cell_type": "markdown", - "id": "fe8a1e8e-aefa-40fb-bc31-18320c6b21f5", - "metadata": {}, - "source": [ - "## Dataset Citations" - ] - }, - { - "cell_type": "markdown", - "id": "03fb3224-6818-4124-a97b-ec568c67ef3e", - "metadata": {}, - "source": [ - " @misc{ma2025stepvideot2vtechnicalreportpractice, \n", - " title={Step-Video-T2V Technical Report: The Practice, Challenges, and Future of Video Foundation Model}, \n", - " author={Guoqing Ma and Haoyang Huang and Kun Yan and Liangyu Chen and Nan Duan and Shengming Yin and Changyi Wan and Ranchen Ming and Xiaoniu Song and Xing Chen and Yu Zhou and Deshan Sun and Deyu Zhou and Jian Zhou and Kaijun Tan and Kang An and Mei Chen and Wei Ji and Qiling Wu and Wen Sun and Xin Han and Yanan Wei and Zheng Ge and Aojie Li and Bin Wang and Bizhu Huang and Bo Wang and Brian Li and Changxing Miao and Chen Xu and Chenfei Wu and Chenguang Yu and Dapeng Shi and Dingyuan Hu and Enle Liu and Gang Yu and Ge Yang and Guanzhe Huang and Gulin Yan and 
Haiyang Feng and Hao Nie and Haonan Jia and Hanpeng Hu and Hanqi Chen and Haolong Yan and Heng Wang and Hongcheng Guo and Huilin Xiong and Huixin Xiong and Jiahao Gong and Jianchang Wu and Jiaoren Wu and Jie Wu and Jie Yang and Jiashuai Liu and Jiashuo Li and Jingyang Zhang and Junjing Guo and Junzhe Lin and Kaixiang Li and Lei Liu and Lei Xia and Liang Zhao and Liguo Tan and Liwen Huang and Liying Shi and Ming Li and Mingliang Li and Muhua Cheng and Na Wang and Qiaohui Chen and Qinglin He and Qiuyan Liang and Quan Sun and Ran Sun and Rui Wang and Shaoliang Pang and Shiliang Yang and Sitong Liu and Siqi Liu and Shuli Gao and Tiancheng Cao and Tianyu Wang and Weipeng Ming and Wenqing He and Xu Zhao and Xuelin Zhang and Xianfang Zeng and Xiaojia Liu and Xuan Yang and Yaqi Dai and Yanbo Yu and Yang Li and Yineng Deng and Yingming Wang and Yilei Wang and Yuanwei Lu and Yu Chen and Yu Luo and Yuchu Luo and Yuhe Yin and Yuheng Feng and Yuxiang Yang and Zecheng Tang and Zekai Zhang and Zidong Yang and Binxing Jiao and Jiansheng Chen and Jing Li and Shuchang Zhou and Xiangyu Zhang and Xinhao Zhang and Yibo Zhu and Heung-Yeung Shum and Daxin Jiang},\n", - " year={2025},\n", - " eprint={2502.10248},\n", - " archivePrefix={arXiv},\n", - " primaryClass={cs.CV},\n", - " url={https://arxiv.org/abs/2502.10248}, \n", - " }" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3 (ipykernel)", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.12.10" - }, - "widgets": { - "application/vnd.jupyter.widget-state+json": { - "state": { - "05a1e4abf5b046c29125e02d004059a0": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLStyleModel", - "state": { - "description_width": "", - 
"font_size": null, - "text_color": null - } - }, - "06788d02ed4a4696affe2a2753bc88da": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLModel", - "state": { - "layout": "IPY_MODEL_a8b4bfd9c16f471992060cc05d45d22d", - "style": "IPY_MODEL_9cb93838bc474e28af02ee42b4bd7b6c", - "value": "\nPro Tip: If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks.
" - } - }, - "0d018534eeb949a187ce8fbbd9bfa941": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "1cd422a26899462c816a8bd827e8a94c": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "VBoxModel", - "state": { - "children": [ - "IPY_MODEL_de408595e9464d8882c9163de8c250fa", - "IPY_MODEL_dae4f862127b41468caa1aab709bc1eb", - "IPY_MODEL_36b84737080741b386a5e67a7e71098e", - "IPY_MODEL_78cf341e3b764c219fa49e431355ca86", - "IPY_MODEL_06788d02ed4a4696affe2a2753bc88da" - ], - "layout": "IPY_MODEL_a1d2eba2d2984f7cafd0d461628cf4c4" - } - }, - "1d729736fbcb482dac67802542714c5e": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "FloatProgressModel", - "state": { - "bar_style": "success", - "layout": "IPY_MODEL_8dd3c7571a7d4e02a1cf571167aa5e00", - "max": 2, - "style": "IPY_MODEL_eb7a88fd11554b84b5c848501000af91", - "value": 2 - } - }, - "1f74aa3526654d0da63f0cb3463386fb": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "CheckboxStyleModel", - "state": { - "description_width": "" - } - }, - "2a6ddf66b0a34b4da63c64e9df859465": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "36b84737080741b386a5e67a7e71098e": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "CheckboxModel", - "state": { - "description": "Add token as git credential?", - "disabled": false, - "layout": "IPY_MODEL_c38387ffede745e68b3be6ec9f61a1eb", - "style": "IPY_MODEL_1f74aa3526654d0da63f0cb3463386fb", - "value": true - } - }, - "6714fabaf6854f379881bd8ac800a18d": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "78cf341e3b764c219fa49e431355ca86": { - "model_module": 
"@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "ButtonModel", - "state": { - "description": "Login", - "layout": "IPY_MODEL_c282851109ab4a219209d4ef7669bb0d", - "style": "IPY_MODEL_94bd57adb50c49b79486e45acac66f90", - "tooltip": null - } - }, - "8dd3c7571a7d4e02a1cf571167aa5e00": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "90f2f0e3475c4743a832dcd3f061c1fa": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "TextStyleModel", - "state": { - "description_width": "", - "font_size": null, - "text_color": null - } - }, - "94bd57adb50c49b79486e45acac66f90": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "ButtonStyleModel", - "state": { - "font_family": null, - "font_size": null, - "font_style": null, - "font_variant": null, - "font_weight": null, - "text_color": null, - "text_decoration": null - } - }, - "9cb93838bc474e28af02ee42b4bd7b6c": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLStyleModel", - "state": { - "description_width": "", - "font_size": null, - "text_color": null - } - }, - "a1d2eba2d2984f7cafd0d461628cf4c4": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": { - "align_items": "center", - "display": "flex", - "flex_flow": "column", - "width": "50%" - } - }, - "a8b4bfd9c16f471992060cc05d45d22d": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "bbe8609ac6354ab0b9405922f151f441": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLModel", - "state": { - "layout": "IPY_MODEL_0d018534eeb949a187ce8fbbd9bfa941", - "style": "IPY_MODEL_05a1e4abf5b046c29125e02d004059a0", - "value": " 
2/2 [00:44<00:00, 22.01s/it]" - } - }, - "c282851109ab4a219209d4ef7669bb0d": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "c38387ffede745e68b3be6ec9f61a1eb": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "cebd89176601477fa21d9184db415d90": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLStyleModel", - "state": { - "description_width": "", - "font_size": null, - "text_color": null - } - }, - "ced14b38c76c4b81b27d403077e95272": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLStyleModel", - "state": { - "description_width": "", - "font_size": null, - "text_color": null - } - }, - "dac567963bd54bdead3f259b41438c6b": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "dae4f862127b41468caa1aab709bc1eb": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "PasswordModel", - "state": { - "description": "Token:", - "layout": "IPY_MODEL_6714fabaf6854f379881bd8ac800a18d", - "style": "IPY_MODEL_90f2f0e3475c4743a832dcd3f061c1fa" - } - }, - "de408595e9464d8882c9163de8c250fa": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLModel", - "state": { - "layout": "IPY_MODEL_dac567963bd54bdead3f259b41438c6b", - "style": "IPY_MODEL_ced14b38c76c4b81b27d403077e95272", - "value": "

Copy a token from your Hugging Face\ntokens page and paste it below.
Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file.
" - } - }, - "e633a8f0fc8d439abba63be9e41ab3c6": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HTMLModel", - "state": { - "layout": "IPY_MODEL_ef7a0c0a6fe64d0a961772ac85c741c2", - "style": "IPY_MODEL_cebd89176601477fa21d9184db415d90", - "value": "Loading checkpoint shards: 100%" - } - }, - "eb7a88fd11554b84b5c848501000af91": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "ProgressStyleModel", - "state": { - "description_width": "" - } - }, - "ef7a0c0a6fe64d0a961772ac85c741c2": { - "model_module": "@jupyter-widgets/base", - "model_module_version": "2.0.0", - "model_name": "LayoutModel", - "state": {} - }, - "ff01fa9425494c56a00236861a40e688": { - "model_module": "@jupyter-widgets/controls", - "model_module_version": "2.0.0", - "model_name": "HBoxModel", - "state": { - "children": [ - "IPY_MODEL_e633a8f0fc8d439abba63be9e41ab3c6", - "IPY_MODEL_1d729736fbcb482dac67802542714c5e", - "IPY_MODEL_bbe8609ac6354ab0b9405922f151f441" - ], - "layout": "IPY_MODEL_2a6ddf66b0a34b4da63c64e9df859465" - } - } - }, - "version_major": 2, - "version_minor": 0 - } - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/Video-Description-Generation-Query-Retrieval/Video_RAG_Ollama.ipynb b/Video-Description-Generation-Query-Retrieval/Video_RAG_Ollama.ipynb new file mode 100644 index 0000000..128785f --- /dev/null +++ b/Video-Description-Generation-Query-Retrieval/Video_RAG_Ollama.ipynb @@ -0,0 +1,767 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "79fcc40b-974c-4d09-9cb4-99f0b6706f33", + "metadata": {}, + "source": [ + "# Video Description Generation and Query Retrieval" + ] + }, + { + "cell_type": "markdown", + "id": "9ae88b40", + "metadata": {}, + "source": [ + "## Overview" + ] + }, + { + "cell_type": "markdown", + "id": "3a593030", + "metadata": {}, + "source": [ + "This notebook demonstrates how to generate video descriptions using the **Qwen2.5-VL (Qwen 2.5 
Vision-Language model)** via **Ollama** and store their embeddings in **ChromaDB** for efficient semantic search on **Intel® Core™ Ultra Processors**. \n", + "\n", + "For each video, a description is generated using Ollama's vision model and stored as an embedding in ChromaDB. When a user submits a query, cosine similarity search is performed in ChromaDB to retrieve the most relevant video description. The matching video is then displayed inline.\n", + "\n", + "This sample uses the videos from the [**stepfun-ai/Step-Video-T2V-Eval**](https://huggingface.co/datasets/stepfun-ai/Step-Video-T2V-Eval) Hugging Face dataset.\n", + "\n", + "\n", + "- Uses Ollama as the GPU backend\n", + "- Simpler setup - no complex model loading required\n", + "- Uses Qwen2.5-VL vision model through Ollama\n", + "- ChromaDB and semantic search functionality" + ] + }, + { + "cell_type": "markdown", + "id": "ad8ec879", + "metadata": {}, + "source": [ + "## Workflow" + ] + }, + { + "cell_type": "markdown", + "id": "274819d8", + "metadata": {}, + "source": [ + "- During the initial data load, videos from the dataset are processed using **Ollama's Qwen2.5-VL vision model**\n", + "- The model generates descriptions for each video\n", + "- Generated video descriptions are converted into embeddings using **Sentence Transformers** (all-MiniLM-L6-v2 model)\n", + "- These embeddings, along with descriptions and video metadata, are stored in a persistent local **ChromaDB** collection\n", + "- When a user submits a query, the text is encoded into an embedding and used to perform semantic search (via cosine similarity) over the ChromaDB collection\n", + "- The most relevant video description and associated video file are returned and displayed" + ] + }, + { + "cell_type": "markdown", + "id": "0f4c8809", + "metadata": {}, + "source": [ + "## Prerequisites\n", + "\n", + "Before running this notebook, ensure you have:\n", + "1. **Ollama installed** and running locally\n", + "2. 
**A vision model** pulled in Ollama: `ollama pull llama3.2-vision` or `ollama pull llava` (or any vision-capable model)\n", + "3. The video dataset downloaded" + ] + }, + { + "cell_type": "markdown", + "id": "e6ee3aa8-d8c6-44be-869b-422cc728d452", + "metadata": {}, + "source": [ + "## Setup: Install Dependencies\n", + "\n", + "Run this cell first to ensure all required packages are installed in the current environment." + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "4ca1579a", + "metadata": {}, + "outputs": [], + "source": [ + "import sys\n", + "import subprocess\n", + "\n", + "# Install dependencies if not already installed\n", + "required_packages = [\n", + " \"ollama>=0.4.0\",\n", + " \"chromadb>=1.0.12\",\n", + " \"sentence-transformers>=4.1.0\",\n", + " \"opencv-python>=4.8.0\",\n", + " \"numpy>=1.24.0\",\n", + " \"tqdm>=4.65.0\",\n", + "]\n", + "\n", + "print(\"Checking and installing required packages...\")\n", + "for package in required_packages:\n", + " try:\n", + " package_name = package.split(\">=\")[0]\n", + " __import__(package_name.replace(\"-\", \"_\"))\n", + " print(f\"✓ {package_name} already installed\")\n", + " except ImportError:\n", + " print(f\"Installing {package}...\")\n", + " subprocess.check_call([sys.executable, \"-m\", \"pip\", \"install\", package])\n", + " print(f\"✓ {package} installed successfully\")\n", + "\n", + "print(\"\\n✅ All dependencies are ready!\")" + ] + }, + { + "cell_type": "markdown", + "id": "3c8bc613", + "metadata": {}, + "source": [ + "## Building Ollama with GPU Support (Vulkan)\n", + "\n", + "For advanced users who want to build Ollama from source with Vulkan GPU acceleration on Windows:\n", + "\n", + "### Installation Steps\n", + "\n", + "1. **Install Vulkan SDK**\n", + " - Download from: https://vulkan.lunarg.com/sdk/home\n", + "\n", + "2. **Install TDM-GCC**\n", + " - Download from: https://github.com/jmeubank/tdm-gcc/releases/tag/v10.3.0-tdm64-2\n", + "\n", + "3. 
**Install Go SDK**\n", + " - Download Go v1.24.9: https://go.dev/dl/go1.24.9.windows-amd64.msi\n", + "\n", + "4. **Build Ollama**\n", + " ```bash\n", + " # Set environment variables\n", + " set CGO_ENABLED=1\n", + " set CGO_CFLAGS=-IC:\\VulkanSDK\\1.4.321.1\\Include\n", + " \n", + " # Build with CMake\n", + " cmake -B build\n", + " cmake --build build --config Release -j14\n", + " \n", + " # Build Go binary\n", + " go build\n", + " \n", + " # Run Ollama server (Terminal 1)\n", + " go run . serve\n", + " \n", + " # Test with a model (Terminal 2)\n", + " ollama run gemma3:270m\n", + " ```\n", + "\n", + "**Note:** This is for advanced users who want to compile Ollama from source. The pre-built Ollama installation works fine for most users." + ] + }, + { + "cell_type": "markdown", + "id": "90f262ea", + "metadata": {}, + "source": [ + "## Import necessary packages" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f012ada9", + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "import base64\n", + "import random\n", + "import shutil\n", + "import logging\n", + "import chromadb\n", + "import warnings\n", + "import ollama\n", + "from tqdm import tqdm\n", + "from IPython.display import Video, display\n", + "from sentence_transformers import SentenceTransformer\n", + "\n", + "logging.basicConfig(level=logging.INFO)\n", + "warnings.filterwarnings(\"ignore\")" + ] + }, + { + "cell_type": "markdown", + "id": "699f3cf3", + "metadata": {}, + "source": [ + "## Configuration" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "600359d0", + "metadata": {}, + "outputs": [], + "source": [ + "# Ollama configuration\n", + "OLLAMA_BASE_URL = \"http://localhost:11434\"\n", + "VISION_MODEL = \"llama3.2-vision\" # or \"llava\" or other vision models\n", + "EMBEDDING_MODEL = \"all-MiniLM-L6-v2\"\n", + "\n", + "# Database configuration\n", + "DATABASE_PATH = \"./Video_descriptions_database_ollama\"\n", + "COLLECTION_NAME = 
\"Video_descriptions_ollama\"" + ] + }, + { + "cell_type": "markdown", + "id": "7bc20fa8", + "metadata": {}, + "source": [ + "## Get video file paths" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "f30e37db", + "metadata": {}, + "outputs": [], + "source": [ + "def get_video_paths():\n", + " \"\"\"\n", + " Select the number of videos to process and return the selected video file paths.\n", + "\n", + " Returns:\n", + " list: Selected list of video files paths.\n", + " \"\"\"\n", + " try:\n", + " dataset_folder = \"Step-Video-T2V-Eval\"\n", + " max_videos_to_select = 128\n", + " video_extensions = ['.mp4', '.avi', '.mov', '.mkv', '.flv', '.wmv']\n", + " video_files = []\n", + " \n", + " for root, dirs, files in os.walk(dataset_folder):\n", + " video_files.extend([\n", + " os.path.join(root, f) for f in files \n", + " if any(f.lower().endswith(ext) for ext in video_extensions)\n", + " ])\n", + " \n", + " total_video_files = len(video_files)\n", + " num_videos_to_select = min(total_video_files, max_videos_to_select)\n", + " \n", + " random.seed(42)\n", + " selected_video_files = random.sample(video_files, num_videos_to_select)\n", + " \n", + " logging.info(f\" Total number of video files found: {total_video_files}\")\n", + " logging.info(f\" Selected {num_videos_to_select} video files\")\n", + " \n", + " return selected_video_files\n", + " except Exception as e:\n", + " logging.exception(f\" Error while extracting the video paths: {str(e)}\")\n", + " return []" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "cef968d6", + "metadata": {}, + "outputs": [], + "source": [ + "selected_video_files = get_video_paths()" + ] + }, + { + "cell_type": "markdown", + "id": "3541e91c", + "metadata": {}, + "source": [ + "## Initialize models\n", + "Initialize the Sentence Transformer model for embeddings." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9c252d8c", + "metadata": {}, + "outputs": [], + "source": [ + "def initialize_embedding_model():\n", + " \"\"\"\n", + " Initialize Sentence Transformer model for generating embeddings.\n", + "\n", + " Returns:\n", + " SentenceTransformer: The initialized embedding model.\n", + " \"\"\"\n", + " try:\n", + " logging.info(f\" Loading Sentence Transformer Model: {EMBEDDING_MODEL}\")\n", + " embedding_model = SentenceTransformer(EMBEDDING_MODEL)\n", + " return embedding_model\n", + " except Exception as e:\n", + " logging.exception(f\" Error while loading the embedding model: {str(e)}\")\n", + " return None" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "21f8648c", + "metadata": {}, + "outputs": [], + "source": [ + "embedding_model = initialize_embedding_model()" + ] + }, + { + "cell_type": "markdown", + "id": "2d7fe5a1", + "metadata": {}, + "source": [ + "## Encode video frame to base64\n", + "Utility function to encode video frames for Ollama API." 
+ ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9666b01e", + "metadata": {}, + "outputs": [], + "source": [ + "def encode_video_frame(video_path, frame_time=0):\n", + " \"\"\"\n", + " Extract and encode a frame from the video as base64.\n", + " \n", + " Args:\n", + " video_path (str): Path to the video file.\n", + " frame_time (float): Time in seconds to extract the frame.\n", + " \n", + " Returns:\n", + " str: Base64 encoded image string or None if extraction fails.\n", + " \"\"\"\n", + " try:\n", + " import cv2\n", + " \n", + " cap = cv2.VideoCapture(video_path)\n", + " if not cap.isOpened():\n", + " logging.error(f\" Cannot open video: {video_path}\")\n", + " return None\n", + " \n", + " # Set position to specific time\n", + " fps = cap.get(cv2.CAP_PROP_FPS)\n", + " frame_number = int(frame_time * fps)\n", + " cap.set(cv2.CAP_PROP_POS_FRAMES, frame_number)\n", + " \n", + " ret, frame = cap.read()\n", + " cap.release()\n", + " \n", + " if not ret:\n", + " logging.error(f\" Cannot read frame from video: {video_path}\")\n", + " return None\n", + " \n", + " # Encode frame to base64\n", + " _, buffer = cv2.imencode('.jpg', frame)\n", + " frame_base64 = base64.b64encode(buffer).decode('utf-8')\n", + " \n", + " return frame_base64\n", + " except Exception as e:\n", + " logging.exception(f\" Error encoding video frame: {str(e)}\")\n", + " return None" + ] + }, + { + "cell_type": "markdown", + "id": "77ce50cd", + "metadata": {}, + "source": [ + "## Generate video description using Ollama" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "afb851d6", + "metadata": {}, + "outputs": [], + "source": [ + "def generate_video_description_ollama(video_path):\n", + " \"\"\"\n", + " Generate video description using Ollama vision model.\n", + " \n", + " Args:\n", + " video_path (str): Path to the video file.\n", + " \n", + " Returns:\n", + " str: Generated description of the video.\n", + " \"\"\"\n", + " try:\n", + " # Extract a frame 
from the middle of the video\n", + " frame_base64 = encode_video_frame(video_path, frame_time=2.0)\n", + " \n", + " if not frame_base64:\n", + " return \"Unable to process video\"\n", + " \n", + " # Use Ollama API to generate description\n", + " response = ollama.chat(\n", + " model=VISION_MODEL,\n", + " messages=[{\n", + " 'role': 'user',\n", + " 'content': 'Describe this sports video in detail. Focus on the main activity, people, objects, and setting.',\n", + " 'images': [frame_base64]\n", + " }]\n", + " )\n", + " \n", + " description = response['message']['content']\n", + " return description\n", + " \n", + " except Exception as e:\n", + " logging.exception(f\" Error generating description with Ollama: {str(e)}\")\n", + " return \"Error generating description\"" + ] + }, + { + "cell_type": "markdown", + "id": "d381f556", + "metadata": {}, + "source": [ + "## Get or create ChromaDB collection" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1e7cdef6", + "metadata": {}, + "outputs": [], + "source": [ + "def get_or_create_database():\n", + " \"\"\"\n", + " Connects to or creates a persistent ChromaDB collection.\n", + "\n", + " Returns:\n", + " tuple: (collection, existing_descriptions)\n", + " \"\"\"\n", + " try:\n", + " client = chromadb.PersistentClient(path=DATABASE_PATH)\n", + " collection = client.get_or_create_collection(\n", + " name=COLLECTION_NAME,\n", + " metadata={\"hnsw:space\": \"cosine\"}\n", + " )\n", + " \n", + " logging.info(\" Checking existing descriptions in database...\")\n", + " all_items = collection.get(include=[\"metadatas\", \"documents\"])\n", + " \n", + " existing_descriptions = {}\n", + " for metadata, doc in zip(all_items['metadatas'], all_items['documents']):\n", + " existing_descriptions[metadata['video_filename']] = doc\n", + " \n", + " logging.info(f\" Found {len(existing_descriptions)} existing descriptions\")\n", + " return collection, existing_descriptions\n", + " \n", + " except Exception as e:\n", + " 
logging.exception(f\" Error while checking database: {str(e)}\")\n", + " return None, {}" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "5d26017c", + "metadata": {}, + "outputs": [], + "source": [ + "collection, existing_descriptions = get_or_create_database()" + ] + }, + { + "cell_type": "markdown", + "id": "8438c801", + "metadata": {}, + "source": [ + "## Generate and store video descriptions\n", + "\n", + "Each video will be processed:\n", + "1. Check if description already exists in database\n", + "2. If not, generate description using Ollama\n", + "3. Create embedding and store in ChromaDB" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b2e69a08", + "metadata": {}, + "outputs": [], + "source": [ + "def generate_and_store_video_descriptions(selected_video_files, collection, existing_descriptions, embedding_model):\n", + " \"\"\"\n", + " Generate and store video descriptions using Ollama.\n", + " \n", + " Args:\n", + " selected_video_files (list): List of video file paths.\n", + " collection: ChromaDB collection object.\n", + " existing_descriptions (dict): Already processed videos.\n", + " embedding_model: Sentence Transformer model.\n", + " \"\"\"\n", + " try:\n", + " video_descriptions = {}\n", + " \n", + " for video_file in tqdm(selected_video_files, desc=\"Processing videos\"):\n", + " video_filename = os.path.basename(video_file)\n", + " \n", + " # Skip if already processed\n", + " if video_filename in existing_descriptions:\n", + " logging.info(f\" Skipping {video_filename} - already in database\")\n", + " video_descriptions[video_file] = existing_descriptions[video_filename]\n", + " continue\n", + " \n", + " logging.info(f\"\\n Processing {video_filename} using Ollama...\")\n", + " \n", + " # Generate description using Ollama\n", + " description_text = generate_video_description_ollama(video_file)\n", + " video_descriptions[video_file] = description_text\n", + " \n", + " logging.info(f\" Generated 
description: {description_text}\\n\")\n", + " \n", + " # Create embedding\n", + " embedding = embedding_model.encode(description_text).tolist()\n", + " \n", + " # Store in ChromaDB\n", + " collection.add(\n", + " embeddings=[embedding],\n", + " documents=[description_text],\n", + " metadatas=[{\"video_filename\": video_filename}],\n", + " ids=[video_file]\n", + " )\n", + " \n", + " logging.info(f\" Added {video_filename} to database\\n\")\n", + " \n", + " logging.info(f\"\\n Processed {len(video_descriptions)} videos\")\n", + " logging.info(f\" Database now has {collection.count()} total descriptions\")\n", + " \n", + " except Exception as e:\n", + " logging.exception(f\" Error while generating and storing descriptions: {str(e)}\")" + ] + }, + { + "cell_type": "markdown", + "id": "07d2a1ea", + "metadata": {}, + "source": [ + "
\n", + " Generating video descriptions using Ollama. This may take some time.\n", + "
" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "d1290f57", + "metadata": {}, + "outputs": [], + "source": [ + "generate_and_store_video_descriptions(selected_video_files, collection, existing_descriptions, embedding_model)" + ] + }, + { + "cell_type": "markdown", + "id": "1bb8b66c", + "metadata": {}, + "source": [ + "## Query the database" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "1d801454", + "metadata": {}, + "outputs": [], + "source": [ + "def query_videos_descriptions(query, collection, embedding_model):\n", + " \"\"\"\n", + " Query ChromaDB collection to find similar videos.\n", + " \n", + " Args:\n", + " query (str): User query.\n", + " collection: ChromaDB collection object.\n", + " embedding_model: Sentence Transformer model.\n", + " \n", + " Returns:\n", + " dict: Query results.\n", + " \"\"\"\n", + " try:\n", + " query_embedding = embedding_model.encode(query).tolist()\n", + " \n", + " results = collection.query(\n", + " query_embeddings=[query_embedding],\n", + " n_results=1,\n", + " include=[\"documents\", \"metadatas\", \"distances\"]\n", + " )\n", + " \n", + " logging.info(f\" Search results for: '{query}'\\n\")\n", + " \n", + " for doc, metadata, distance in zip(\n", + " results['documents'][0],\n", + " results['metadatas'][0],\n", + " results['distances'][0]\n", + " ):\n", + " similarity_score = 1 - distance\n", + " logging.info(f\" Video filename: {metadata['video_filename']}\")\n", + " logging.info(f\" Similarity score: {similarity_score:.3f}\")\n", + " logging.info(f\" Distance: {distance:.3f}\")\n", + " logging.info(f\" Video description: {doc}\\n\")\n", + " \n", + " return results\n", + " \n", + " except Exception as e:\n", + " logging.exception(f\" Error while querying video descriptions: {str(e)}\")\n", + " return None" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "ed608765", + "metadata": {}, + "outputs": [], + "source": [ + "query = \"Give me the video of the 
birds and blue sea\"\n", + "results = query_videos_descriptions(query, collection, embedding_model)" + ] + }, + { + "cell_type": "markdown", + "id": "9399bfd5", + "metadata": {}, + "source": [ + "## Display the video" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9e55e905", + "metadata": {}, + "outputs": [], + "source": [ + "def display_video(results):\n", + " \"\"\"\n", + " Display the video based on query results.\n", + " \n", + " Args:\n", + " results (dict): Query results.\n", + " \"\"\"\n", + " try:\n", + " if results and results['ids']:\n", + " video_path = results['ids'][0][0]\n", + " video = Video(video_path, width=600, height=400)\n", + " display(video)\n", + " else:\n", + " logging.info(\" No video found\")\n", + " except Exception as e:\n", + " logging.exception(f\" Error while displaying the video: {str(e)}\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "bf235da1", + "metadata": {}, + "outputs": [], + "source": [ + "display_video(results)" + ] + }, + { + "cell_type": "markdown", + "id": "fda2e217", + "metadata": {}, + "source": [ + "## Remove the database" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "9d6ba65c", + "metadata": {}, + "outputs": [], + "source": [ + "def delete_database():\n", + " \"\"\"\n", + " Delete the database directory.\n", + " \"\"\"\n", + " if os.path.exists(DATABASE_PATH):\n", + " logging.info(\"Database deletion option available.\")\n", + " database_deletion = 'no' # Change to 'yes' to delete\n", + " \n", + " if database_deletion == 'yes':\n", + " try:\n", + " shutil.rmtree(DATABASE_PATH)\n", + " logging.info(\" Database deleted!\")\n", + " except Exception as e:\n", + " logging.exception(f\" Error while deleting database: {str(e)}\")\n", + " else:\n", + " logging.info(\" Database not deleted\")\n", + " else:\n", + " logging.info(\" Database is not available\")" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "b8070cae", + 
"metadata": {}, + "outputs": [], + "source": [ + "delete_database()" + ] + }, + { + "cell_type": "markdown", + "id": "4a2bba50", + "metadata": {}, + "source": [ + "## Dataset Citations" + ] + }, + { + "cell_type": "markdown", + "id": "7613a434", + "metadata": {}, + "source": [ + " @misc{ma2025stepvideot2vtechnicalreportpractice, \n", + " title={Step-Video-T2V Technical Report: The Practice, Challenges, and Future of Video Foundation Model}, \n", + " author={Guoqing Ma and Haoyang Huang and Kun Yan and Liangyu Chen and Nan Duan and Shengming Yin and Changyi Wan and Ranchen Ming and Xiaoniu Song and Xing Chen and Yu Zhou and Deshan Sun and Deyu Zhou and Jian Zhou and Kaijun Tan and Kang An and Mei Chen and Wei Ji and Qiling Wu and Wen Sun and Xin Han and Yanan Wei and Zheng Ge and Aojie Li and Bin Wang and Bizhu Huang and Bo Wang and Brian Li and Changxing Miao and Chen Xu and Chenfei Wu and Chenguang Yu and Dapeng Shi and Dingyuan Hu and Enle Liu and Gang Yu and Ge Yang and Guanzhe Huang and Gulin Yan and Haiyang Feng and Hao Nie and Haonan Jia and Hanpeng Hu and Hanqi Chen and Haolong Yan and Heng Wang and Hongcheng Guo and Huilin Xiong and Huixin Xiong and Jiahao Gong and Jianchang Wu and Jiaoren Wu and Jie Wu and Jie Yang and Jiashuai Liu and Jiashuo Li and Jingyang Zhang and Junjing Guo and Junzhe Lin and Kaixiang Li and Lei Liu and Lei Xia and Liang Zhao and Liguo Tan and Liwen Huang and Liying Shi and Ming Li and Mingliang Li and Muhua Cheng and Na Wang and Qiaohui Chen and Qinglin He and Qiuyan Liang and Quan Sun and Ran Sun and Rui Wang and Shaoliang Pang and Shiliang Yang and Sitong Liu and Siqi Liu and Shuli Gao and Tiancheng Cao and Tianyu Wang and Weipeng Ming and Wenqing He and Xu Zhao and Xuelin Zhang and Xianfang Zeng and Xiaojia Liu and Xuan Yang and Yaqi Dai and Yanbo Yu and Yang Li and Yineng Deng and Yingming Wang and Yilei Wang and Yuanwei Lu and Yu Chen and Yu Luo and Yuchu Luo and Yuhe Yin and Yuheng Feng and Yuxiang Yang and Zecheng Tang and 
Zekai Zhang and Zidong Yang and Binxing Jiao and Jiansheng Chen and Jing Li and Shuchang Zhou and Xiangyu Zhang and Xinhao Zhang and Yibo Zhu and Heung-Yeung Shum and Daxin Jiang},\n", + " year={2025},\n", + " eprint={2502.10248},\n", + " archivePrefix={arXiv},\n", + " primaryClass={cs.CV},\n", + " url={https://arxiv.org/abs/2502.10248}, \n", + " }" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "AI PC Samples", + "language": "python", + "name": "ai_pc_samples" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.12.10" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git a/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/data_level0.bin b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/data_level0.bin new file mode 100644 index 0000000..09cffb6 Binary files /dev/null and b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/data_level0.bin differ diff --git a/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/header.bin b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/header.bin new file mode 100644 index 0000000..e85f465 Binary files /dev/null and b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/header.bin differ diff --git a/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/length.bin 
b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/length.bin new file mode 100644 index 0000000..f79b7db Binary files /dev/null and b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/length.bin differ diff --git a/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/link_lists.bin b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/3796f63e-da6e-45c5-bba9-dcb86401dc45/link_lists.bin new file mode 100644 index 0000000..e69de29 diff --git a/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/chroma.sqlite3 b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/chroma.sqlite3 new file mode 100644 index 0000000..e412276 Binary files /dev/null and b/Video-Description-Generation-Query-Retrieval/Video_descriptions_database_ollama/chroma.sqlite3 differ diff --git a/Video-Description-Generation-Query-Retrieval/pyproject.toml b/Video-Description-Generation-Query-Retrieval/pyproject.toml index c845aed..ab1863e 100644 --- a/Video-Description-Generation-Query-Retrieval/pyproject.toml +++ b/Video-Description-Generation-Query-Retrieval/pyproject.toml @@ -1,33 +1,18 @@ [project] -name = "video-description-generation-query-retrieval" +name = "video-rag-ollama" version = "0.1.0" -description = "Add your description here" -readme = "README.md" +description = "Video RAG application using Ollama vision models for semantic video search" +readme = "README_Ollama.md" requires-python = ">=3.12.0" dependencies = [ - "torch>=2.7.0", - "torchvision>=0.22.0", - "pytorch-triton-xpu>=3.3.0 ; sys_platform == 'win32' or sys_platform == 'linux'", - "jupyter>=1.1.1", + "ollama>=0.4.0", + "streamlit>=1.30.0", "chromadb>=1.0.12", - "huggingface_hub[hf_xet]>=0.32.3", - "qwen-vl-utils[decord]>=0.0.11", 
"sentence-transformers>=4.1.0", - "transformers>=4.52.4", -] - -[tool.uv.sources] -torch = [ - { index = "pytorch-xpu", marker = "sys_platform == 'win32' or sys_platform == 'linux'" }, -] -torchvision = [ - { index = "pytorch-xpu", marker = "sys_platform == 'win32' or sys_platform == 'linux'" }, -] -pytorch-triton-xpu = [ - { index = "pytorch-xpu", marker = "sys_platform == 'win32' or sys_platform == 'linux'" }, + "opencv-python>=4.8.0", + "numpy>=1.24.0", + "tqdm>=4.65.0", + "jupyter>=1.1.1", + "ipykernel>=6.25.0", + "ipywidgets>=8.1.0", ] - -[[tool.uv.index]] -name = "pytorch-xpu" -url = "https://download.pytorch.org/whl/xpu" -explicit = true diff --git a/Video-Description-Generation-Query-Retrieval/st_video_rag_demo.py b/Video-Description-Generation-Query-Retrieval/st_video_rag_demo.py new file mode 100644 index 0000000..24417e1 --- /dev/null +++ b/Video-Description-Generation-Query-Retrieval/st_video_rag_demo.py @@ -0,0 +1,731 @@ +import os +import base64 +import shutil +import logging +import chromadb +import warnings +import ollama +import cv2 +import streamlit as st +from sentence_transformers import SentenceTransformer + +warnings.filterwarnings("ignore") +logging.basicConfig(level=logging.INFO) + +# Configuration +OLLAMA_BASE_URL = "http://localhost:11434" +DATABASE_PATH = "./Video_descriptions_database_ollama" +COLLECTION_NAME = "Video_descriptions_ollama" +EMBEDDING_MODEL = "all-MiniLM-L6-v2" + +# Page config +st.set_page_config( + page_title="Video RAG with Ollama on Intel GPUs", + layout="wide", + initial_sidebar_state="expanded" +) + +# Custom CSS for better styling +st.markdown(""" + +""", unsafe_allow_html=True) + +st.markdown('
🎥 Video RAG: Semantic Video Search
', unsafe_allow_html=True) +st.markdown('
Powered by Ollama on Intel® Arc™ & Core™ Ultra Processors
', unsafe_allow_html=True) + +# Initialize session state +if "collection" not in st.session_state: + st.session_state.collection = None +if "embedding_model" not in st.session_state: + st.session_state.embedding_model = None +if "video_files" not in st.session_state: + st.session_state.video_files = [] +if "database_loaded" not in st.session_state: + st.session_state.database_loaded = False + +# Sidebar configuration +with st.sidebar: + st.markdown("### 🎥 Video RAG") + st.markdown("---") + + st.header("⚙️ Configuration") + + # Model selection - show all models + try: + response = ollama.list() + all_models = [model.model for model in response.models] + + if not all_models: + st.error("⚠️ No models found! Please pull a model:") + st.code("ollama pull llava", language="bash") + all_models = ["llava"] + + selected_model = st.selectbox( + "🤖 Model", + all_models, + key="vision_model" + ) + + model_lower = selected_model.lower() + vision_patterns = ['llava', 'llama3.2-vision', 'minicpm-v', 'qwen', 'cogvlm', 'bakllava'] + + if any(pattern in model_lower for pattern in vision_patterns): + if 'llava' in model_lower: + st.success("✅ Vision model") + elif 'llama3.2-vision' in model_lower: + st.info("💡 Vision model") + elif 'qwen' in model_lower: + st.success("✅ Vision model") + else: + st.info("💡 Vision model detected") + else: + st.warning("⚠️ This model may not support vision/images") + + except Exception as e: + st.warning(f"⚠️ Ollama not accessible: {e}") + st.info("Please ensure Ollama is running: `ollama serve`") + selected_model = "llava" + + max_tokens = 100 + temperature = 0.7 + + st.markdown("---") + + # Dataset configuration + st.subheader("📁 Dataset") + dataset_folder = st.text_input("Video Folder", ".") + max_videos = st.slider("Max Videos", 1, 128, 20) + + st.markdown("---") + + # Database info + st.subheader("🗄️ Database") + if os.path.exists(DATABASE_PATH): + st.success("✅ Database Ready") + if st.button("🔄 Reset Database", type="secondary"): + try: + 
shutil.rmtree(DATABASE_PATH) + st.success("Database reset!") + st.session_state.collection = None + st.session_state.database_loaded = False + st.rerun() + except Exception as e: + st.error(f"Error: {e}") + else: + st.info("💾 No database found") + + st.markdown("---") + st.markdown("### 🚀 Intel Optimizations") + st.markdown("✓ Intel Arc™ Graphics") + st.markdown("✓ Intel Core™ Ultra") + st.markdown("✓ Hardware Acceleration") + + +def encode_video_frame(video_path, frame_time=2.0): + """Extract and encode a frame from video.""" + try: + cap = cv2.VideoCapture(video_path) + if not cap.isOpened(): + return None + + fps = cap.get(cv2.CAP_PROP_FPS) + frame_number = int(frame_time * fps) + cap.set(cv2.CAP_PROP_POS_FRAMES, frame_number) + + ret, frame = cap.read() + cap.release() + + if not ret: + return None + + _, buffer = cv2.imencode('.jpg', frame) + frame_base64 = base64.b64encode(buffer).decode('utf-8') + return frame_base64 + except Exception as e: + logging.error(f"Frame encoding error: {e}") + return None + + +def generate_video_description_ollama(video_path, model, max_tokens=100, temperature=0.7): + """Generate video description using Ollama vision model.""" + try: + frame_base64 = encode_video_frame(video_path, frame_time=2.0) + + if not frame_base64: + return "Unable to process video" + + response = ollama.chat( + model=model, + messages=[{ + 'role': 'user', + 'content': 'Describe this video frame concisely for search. 
Include main subjects, actions, setting, and key visual details in 2-3 sentences.', + 'images': [frame_base64] + }], + options={ + 'num_predict': max_tokens, + 'temperature': temperature, + 'num_ctx': 2048, + 'num_gpu': 99 + } + ) + + message = response['message'] + description = message.get('content', '') + + if not description or len(description.strip()) == 0: + description = message.get('thinking', '') + + if not description or len(description.strip()) == 0: + return "Empty response from model" + + return description + except Exception as e: + logging.error(f"Description generation error: {e}") + return "Error generating description" + + +def get_video_paths(folder, max_count): + """Get video file paths from folder.""" + try: + video_extensions = ['.mp4', '.avi', '.mov', '.mkv', '.flv', '.wmv'] + video_files = [] + + folder_path = os.path.abspath(folder) + + for root, dirs, files in os.walk(folder_path): + video_files.extend([ + os.path.join(root, f) for f in files + if any(f.lower().endswith(ext) for ext in video_extensions) + ]) + + if len(video_files) > max_count: + video_files = video_files[:max_count] + + return video_files + except Exception as e: + logging.error(f"Error finding videos: {e}") + return [] + + +def initialize_database(): + """Initialize ChromaDB and embedding model.""" + try: + client = chromadb.PersistentClient(path=DATABASE_PATH) + collection = client.get_or_create_collection( + name=COLLECTION_NAME, + metadata={"hnsw:space": "cosine"} + ) + + embedding_model = SentenceTransformer(EMBEDDING_MODEL) + + return collection, embedding_model + except Exception as e: + error_msg = str(e) + + # Handle tenant connection issues + if "Could not connect to tenant" in error_msg or "default_tenant" in error_msg: + st.error(f"Database initialization error: {e}") + st.warning("⚠️ ChromaDB database is corrupted or incompatible.") + + if st.button("🔄 Reset Database", type="primary"): + try: + # Remove corrupted database + if os.path.exists(DATABASE_PATH): + 
shutil.rmtree(DATABASE_PATH) + st.success("✅ Database removed. Click 'Start Processing Videos' again.") + st.rerun() + except Exception as reset_error: + st.error(f"Failed to reset database: {reset_error}") + + st.info("💡 **To fix manually:**\n\n1. Close this app\n2. Delete folder: `Video_descriptions_database_ollama`\n3. Restart the app") + return None, None + else: + st.error(f"Database initialization error: {e}") + return None, None + + +def get_existing_descriptions(collection): + """Get existing descriptions from database.""" + try: + all_items = collection.get(include=["metadatas"]) + existing = {meta['video_filename']: True for meta in all_items['metadatas']} + return existing + except: + return {} + + +# Main tabs +tab1, tab2, tab3, tab4 = st.tabs(["🎬 Process Videos", "🔍 Search Videos", "📊 Architecture", "ℹ️ About"]) + +with tab1: + st.header("Process Videos and Build Knowledge Base") + + col1, col2, col3 = st.columns(3) + with col1: + st.markdown('

🤖 AI Model

Qwen Vision-Language

', unsafe_allow_html=True) + with col2: + st.markdown('

💾 Storage

ChromaDB Vector Store

', unsafe_allow_html=True) + with col3: + st.markdown('

🔍 Search

Semantic Similarity

', unsafe_allow_html=True) + + st.markdown("---") + + if st.button("🚀 Start Processing Videos", type="primary", use_container_width=True): + with st.spinner("Initializing AI models on Intel GPU..."): + collection, embedding_model = initialize_database() + + if collection is None: + st.error("Failed to initialize database") + st.stop() + + st.session_state.collection = collection + st.session_state.embedding_model = embedding_model + + with st.spinner("Scanning for video files..."): + video_files = get_video_paths(dataset_folder, max_videos) + + if not video_files: + st.error(f"❌ No video files found in '{os.path.abspath(dataset_folder)}'") + st.info("💡 Supported: .mp4, .avi, .mov, .mkv, .flv, .wmv") + st.stop() + + st.session_state.video_files = video_files + st.success(f"✅ Found {len(video_files)} videos") + + existing = get_existing_descriptions(collection) + st.info(f"📚 Database contains {len(existing)} existing descriptions") + + progress_bar = st.progress(0) + status_text = st.empty() + + processed = 0 + skipped = 0 + + for idx, video_file in enumerate(video_files): + video_filename = os.path.basename(video_file) + progress = (idx + 1) / len(video_files) + progress_bar.progress(progress) + status_text.text(f"Processing {idx + 1}/{len(video_files)}: {video_filename}") + + if video_filename in existing: + skipped += 1 + continue + + try: + description = generate_video_description_ollama(video_file, selected_model, max_tokens, temperature) + embedding = embedding_model.encode(description).tolist() + + collection.add( + embeddings=[embedding], + documents=[description], + metadatas=[{"video_filename": video_filename}], + ids=[video_file] + ) + + processed += 1 + + except Exception as e: + st.warning(f"Error processing {video_filename}: {e}") + + progress_bar.progress(1.0) + status_text.empty() + + st.success(f"✅ Processing Complete!") + col1, col2, col3 = st.columns(3) + col1.metric("Processed", processed, delta=processed) + col2.metric("Skipped", skipped) + 
col3.metric("Total in Database", collection.count()) + + st.session_state.database_loaded = True + st.balloons() + +with tab2: + st.header("Semantic Video Search") + + col1, col2, col3 = st.columns(3) + with col1: + st.markdown('

🔍 AI-Powered

Semantic Understanding

', unsafe_allow_html=True) + with col2: + st.markdown('

⚡ Lightning Fast

Vector Search

', unsafe_allow_html=True) + with col3: + st.markdown('

🎯 Accurate Results

Ranked by Relevance

', unsafe_allow_html=True) + + st.markdown("---") + + if not st.session_state.database_loaded: + if os.path.exists(DATABASE_PATH): + with st.spinner("Loading knowledge base..."): + collection, embedding_model = initialize_database() + if collection: + st.session_state.collection = collection + st.session_state.embedding_model = embedding_model + st.session_state.database_loaded = True + st.success(f"✅ Loaded {collection.count()} video descriptions") + + if not st.session_state.database_loaded: + st.warning("⚠️ Please process videos first") + else: + with st.expander("📋 View All Video Descriptions", expanded=False): + try: + collection = st.session_state.collection + all_data = collection.get(include=["documents", "metadatas"]) + + st.info(f"📊 Total videos: {len(all_data['documents'])}") + + for i, (doc, metadata) in enumerate(zip(all_data['documents'], all_data['metadatas'])): + st.markdown(f"**{i+1}. {metadata['video_filename']}**") + st.text(doc) + if i < len(all_data['documents']) - 1: + st.markdown("---") + except Exception as e: + st.error(f"Error loading descriptions: {e}") + + st.markdown("### 🔍 Enter Your Search Query") + query = st.text_input("", placeholder="e.g., person playing basketball, sunset over ocean, dog running in park", label_visibility="collapsed") + + col1, col2 = st.columns([3, 1]) + with col1: + st.caption("💡 Try: 'person', 'animal', 'outdoor scene', 'sports activity', or keywords from descriptions above") + with col2: + search_button = st.button("🔍 Search", type="primary", use_container_width=True) + + if search_button and query: + with st.spinner("Searching with AI..."): + try: + collection = st.session_state.collection + embedding_model = st.session_state.embedding_model + + query_embedding = embedding_model.encode(query).tolist() + + results = collection.query( + query_embeddings=[query_embedding], + n_results=3, + include=["documents", "metadatas", "distances"] + ) + + st.success("✅ Search Complete!") + st.balloons() + 
st.markdown(f"**Query:** *{query}*") + st.markdown("---") + + for i, (doc, metadata, distance) in enumerate(zip( + results['documents'][0], + results['metadatas'][0], + results['distances'][0] + )): + similarity_score = 1 - distance + video_path = results['ids'][0][i] + + if similarity_score > 0.7: + score_emoji = "🟢" + score_label = "Excellent Match" + elif similarity_score > 0.5: + score_emoji = "🟡" + score_label = "Good Match" + else: + score_emoji = "🟠" + score_label = "Moderate Match" + + with st.expander(f"{score_emoji} Result {i+1}: {metadata['video_filename']} - {score_label} ({similarity_score:.2%})", expanded=(i==0)): + col1, col2 = st.columns([3, 2]) + + with col1: + st.markdown("#### 📝 Video Description") + st.info(doc) + st.markdown("#### 📊 Similarity Metrics") + st.progress(similarity_score) + st.caption(f"Similarity Score: {similarity_score:.2%} | Distance: {distance:.3f}") + + with col2: + if os.path.exists(video_path): + st.markdown("#### 🎬 Video Preview") + st.video(video_path) + else: + st.warning("Video file not found") + + except Exception as e: + st.error(f"Search error: {e}") + +with tab3: + st.header("System Architecture") + + st.markdown(""" + ### Video RAG Pipeline on Intel Hardware + + This system demonstrates the power of Intel GPUs for AI workloads, using Ollama for efficient model inference. 
+ """) + + # Clean architecture diagram using Streamlit columns + st.markdown("### 🔄 System Architecture Flow") + + st.info("**Video Processing Pipeline** - How videos are converted to searchable descriptions") + + cols = st.columns(7) + with cols[0]: + st.markdown("### 📹\n**Video Files**\nInput videos") + with cols[1]: + st.markdown("### ➡️") + with cols[2]: + st.markdown("### 🎞️\n**Extract Frame**\nOpenCV") + with cols[3]: + st.markdown("### ➡️") + with cols[4]: + st.markdown("### 🤖\n**Ollama Vision**\n:blue[Intel GPU]") + with cols[5]: + st.markdown("### ➡️") + with cols[6]: + st.markdown("### 📝\n**Description**\nText output") + + st.markdown("") + + cols2 = st.columns(5) + with cols2[0]: + st.markdown("### 📝\n**Description**") + with cols2[1]: + st.markdown("### ➡️") + with cols2[2]: + st.markdown("### 🔢\n**Embeddings**\n:blue[Transformers]") + with cols2[3]: + st.markdown("### ➡️") + with cols2[4]: + st.markdown("### 💾\n**ChromaDB**\nVector store") + + st.markdown("---") + + st.info("**Search Pipeline** - How queries find relevant videos") + + cols3 = st.columns(7) + with cols3[0]: + st.markdown("### 👤\n**User Query**\nNatural text") + with cols3[1]: + st.markdown("### ➡️") + with cols3[2]: + st.markdown("### 🔢\n**Embedding**\nVector form") + with cols3[3]: + st.markdown("### ➡️") + with cols3[4]: + st.markdown("### 🔍\n**Similarity**\n:blue[Cosine dist]") + with cols3[5]: + st.markdown("### ➡️") + with cols3[6]: + st.markdown("### 🎬\n**Results**\nMatched videos") + + st.markdown("---") + + # Architecture diagram + col1, col2 = st.columns(2) + + with col1: + st.markdown("### 🎯 Key Components") + st.markdown(""" + **1. Video Processing** + - Frame extraction with OpenCV + - Vision model inference on Intel GPU + - Description generation + + **2. Embedding Generation** + - Sentence Transformers + - 384-dimensional vectors + - Semantic representation + + **3. 
Vector Storage** + - ChromaDB persistent storage + - Cosine similarity metric + - Efficient retrieval + """) + + with col2: + st.markdown("### 🚀 Intel Optimizations") + st.markdown(""" + **Hardware Acceleration** + - Intel Arc™ Graphics + - Intel Core™ Ultra Processors + - Intel Iris® Xe Graphics + + **Performance Benefits** + - Fast inference times + - Efficient memory usage + - Local processing + + **Ollama Integration** + - Optimized for Intel hardware + - Easy model management + - Production-ready + """) + + st.markdown("---") + + # Technical details + st.markdown("### 🔧 Technical Stack") + + col1, col2, col3 = st.columns(3) + + with col1: + st.markdown(""" + **AI Models** + - Qwen 2.5 VL + - Llama 3.2 Vision + - MiniLM Embeddings + """) + + with col2: + st.markdown(""" + **Infrastructure** + - Ollama Runtime + - ChromaDB + - Streamlit UI + """) + + with col3: + st.markdown(""" + **Intel Hardware** + - Arc™ GPUs + - Core™ Ultra CPUs + - Iris® Xe Graphics + """) + +with tab4: + st.header("About This Demo") + + st.markdown(""" + ### 🎯 Video RAG with Ollama on Intel GPUs + + This application demonstrates **semantic video search** powered by **Ollama on Intel GPUs**. + It combines vision-language models, vector embeddings, and similarity search to enable + natural language queries over video content and detailed image understanding. + + ### 💡 Use Cases + + - **Video Libraries**: Quickly find specific content in large video collections + - **Content Management**: Search videos by describing what you're looking for + - **Surveillance**: Locate specific events or activities in footage + - **Education**: Find relevant video segments for learning materials + - **Media Production**: Search stock footage by description + + ### 🏗️ How It Works + + 1. **Extract**: Take representative frames from videos + 2. **Describe**: Use AI vision models to generate detailed descriptions + 3. **Embed**: Convert descriptions to semantic vectors + 4. 
**Store**: Save vectors in a searchable database + 5. **Query**: Search using natural language + 6. **Retrieve**: Find most similar videos by semantic meaning + + ### 🚀 Why Intel GPUs? + + - **Performance**: Fast inference for vision models + - **Efficiency**: Optimized power consumption + - **Accessibility**: Available on mainstream devices + - **Local Processing**: No cloud dependency + - **Cost Effective**: Use existing hardware + """) + + st.markdown("---") + + st.markdown("### 🛠️ Technology Stack") + + st.code(""" + # Core Technologies + - Ollama: Local LLM runtime optimized for Intel GPUs + - Qwen 2.5 VL: State-of-the-art vision-language model + - ChromaDB: Efficient vector database + - Sentence Transformers: Text embedding generation + - Streamlit: Interactive web interface + + # Intel Optimizations + - Hardware acceleration on Arc and Iris Xe + - Optimized inference on Core Ultra processors + - Local processing without cloud dependency + """, language="python") + + st.markdown("---") + + # System status + st.markdown("### 📡 System Status") + + col1, col2, col3 = st.columns(3) + + with col1: + try: + ollama.list() + st.success("✅ Ollama Connected") + except: + st.error("❌ Ollama Offline") + + with col2: + if os.path.exists(DATABASE_PATH): + st.success(f"✅ Database Active") + else: + st.info("💾 Database Not Created") + + with col3: + if st.session_state.database_loaded: + st.success(f"✅ {st.session_state.collection.count()} Videos Indexed") + else: + st.info("⏳ Awaiting Processing") + +# Footer +st.markdown("---") +st.markdown( + '
' + '

🎥 Video RAG Demo | Powered by Ollama on ' + 'Intel Arc Graphics and Intel Core Ultra Processors

' + '
', + unsafe_allow_html=True +) diff --git a/Video-Description-Generation-Query-Retrieval/st_video_rag_demo_final.py b/Video-Description-Generation-Query-Retrieval/st_video_rag_demo_final.py new file mode 100644 index 0000000..293bb0e --- /dev/null +++ b/Video-Description-Generation-Query-Retrieval/st_video_rag_demo_final.py @@ -0,0 +1,701 @@ +import os +import base64 +import shutil +import logging +import chromadb +import warnings +import ollama +import cv2 +import streamlit as st +from sentence_transformers import SentenceTransformer + +warnings.filterwarnings("ignore") +logging.basicConfig(level=logging.INFO) + +# Configuration +OLLAMA_BASE_URL = "http://localhost:11434" +DATABASE_PATH = "./Video_descriptions_database_ollama" +COLLECTION_NAME = "Video_descriptions_ollama" +EMBEDDING_MODEL = "all-MiniLM-L6-v2" + +# Page config +st.set_page_config( + page_title="Video RAG with Ollama", + layout="wide", + initial_sidebar_state="expanded" +) + +# Custom CSS for better styling +st.markdown(""" + +""", unsafe_allow_html=True) + +st.markdown('
🎥 Video RAG: Semantic Video Search
', unsafe_allow_html=True) +st.markdown('
Powered by Ollama on Intel® Core™ Ultra Processors
', unsafe_allow_html=True) + +# Initialize session state +if "collection" not in st.session_state: + st.session_state.collection = None +if "embedding_model" not in st.session_state: + st.session_state.embedding_model = None +if "video_files" not in st.session_state: + st.session_state.video_files = [] +if "database_loaded" not in st.session_state: + st.session_state.database_loaded = False + +# Sidebar configuration +with st.sidebar: + st.markdown("### 🎥 Video RAG") + st.markdown("---") + + st.header("⚙️ Configuration") + + # Model selection + try: + response = ollama.list() + all_models = [model.model for model in response.models] + + if not all_models: + st.error("⚠️ No models found! Please pull a model:") + st.code("ollama pull llava", language="bash") + all_models = ["llava"] + + selected_model = st.selectbox( + "🤖 Model", + all_models, + key="vision_model" + ) + + model_lower = selected_model.lower() + vision_patterns = ['llava', 'llama3.2-vision', 'minicpm-v', 'qwen', 'cogvlm', 'bakllava'] + + if any(pattern in model_lower for pattern in vision_patterns): + if 'llava' in model_lower: + st.success("✅ Vision model") + elif 'llama3.2-vision' in model_lower: + st.info("💡 Vision model") + elif 'qwen' in model_lower: + st.success("✅ Vision model") + else: + st.info("💡 Vision model detected") + else: + st.warning("⚠️ This model may not support vision/images") + + except Exception as e: + st.warning(f"⚠️ Ollama not accessible: {e}") + st.info("Please ensure Ollama is running: `ollama serve`") + selected_model = "llava" + + max_tokens = 100 + temperature = 0.7 + + st.markdown("---") + + # Dataset configuration + st.subheader("📁 Dataset") + dataset_folder = st.text_input("Video Folder", "Step-Video-T2V-Eval") + max_videos = st.slider("Max Videos", 1, 128, 20) + + st.markdown("---") + + # Database info + st.subheader("🗄️ Database") + if os.path.exists(DATABASE_PATH): + st.success("✅ Database Ready") + if st.button("🔄 Reset Database", type="secondary"): + try: + 
shutil.rmtree(DATABASE_PATH) + st.success("Database reset!") + st.session_state.collection = None + st.session_state.database_loaded = False + st.rerun() + except Exception as e: + st.error(f"Error: {e}") + else: + st.info("💾 No database found") + + +def encode_video_frame(video_path, frame_time=2.0): + """Extract and encode a frame from video.""" + try: + cap = cv2.VideoCapture(video_path) + if not cap.isOpened(): + return None + + fps = cap.get(cv2.CAP_PROP_FPS) + frame_number = int(frame_time * fps) + cap.set(cv2.CAP_PROP_POS_FRAMES, frame_number) + + ret, frame = cap.read() + cap.release() + + if not ret: + return None + + _, buffer = cv2.imencode('.jpg', frame) + frame_base64 = base64.b64encode(buffer).decode('utf-8') + return frame_base64 + except Exception as e: + logging.error(f"Frame encoding error: {e}") + return None + + +def generate_video_description_ollama(video_path, model, max_tokens=100, temperature=0.7): + """Generate video description using Ollama vision model.""" + try: + frame_base64 = encode_video_frame(video_path, frame_time=2.0) + + if not frame_base64: + st.warning(f"⚠️ Failed to extract frame from {os.path.basename(video_path)}") + return "Unable to process video" + + response = ollama.chat( + model=model, + messages=[{ + 'role': 'user', + 'content': 'Describe this video frame concisely for search. 
Include main subjects, actions, setting, and key visual details in 2-3 sentences.', + 'images': [frame_base64] + }], + options={ + 'num_predict': max_tokens, + 'temperature': temperature, + 'num_ctx': 2048, + 'num_gpu': 99 + } + ) + + message = response['message'] + description = message.get('content', '') + + if not description or len(description.strip()) == 0: + description = message.get('thinking', '') + + if not description or len(description.strip()) == 0: + st.error(f"❌ Empty response from model for {os.path.basename(video_path)}") + return "Empty response from model" + + st.success(f"✅ {os.path.basename(video_path)}: {description[:80]}...") + return description + except Exception as e: + logging.error(f"Description generation error: {e}") + st.error(f"❌ Error: {str(e)}") + return "Error generating description" + + +def get_video_paths(folder, max_count): + """Get video file paths from folder.""" + try: + video_extensions = ['.mp4', '.avi', '.mov', '.mkv', '.flv', '.wmv'] + video_files = [] + + folder_path = os.path.abspath(folder) + + for root, dirs, files in os.walk(folder_path): + video_files.extend([ + os.path.join(root, f) for f in files + if any(f.lower().endswith(ext) for ext in video_extensions) + ]) + + if len(video_files) > max_count: + video_files = video_files[:max_count] + + return video_files + except Exception as e: + logging.error(f"Error finding videos: {e}") + return [] + + +def initialize_database(): + """Initialize ChromaDB and embedding model.""" + try: + client = chromadb.PersistentClient(path=DATABASE_PATH) + collection = client.get_or_create_collection( + name=COLLECTION_NAME, + metadata={"hnsw:space": "cosine"} + ) + + embedding_model = SentenceTransformer(EMBEDDING_MODEL) + + return collection, embedding_model + except Exception as e: + error_msg = str(e) + + if "Could not connect to tenant" in error_msg or "default_tenant" in error_msg: + st.error(f"Database initialization error: {e}") + st.warning("⚠️ ChromaDB database is corrupted 
or incompatible.") + + if st.button("🔄 Reset Database", type="primary"): + try: + if os.path.exists(DATABASE_PATH): + shutil.rmtree(DATABASE_PATH) + st.success("✅ Database removed. Click 'Start Processing Videos' again.") + st.rerun() + except Exception as reset_error: + st.error(f"Failed to reset database: {reset_error}") + + st.info("💡 **To fix manually:**\n\n1. Close this app\n2. Delete folder: `Video_descriptions_database_ollama`\n3. Restart the app") + return None, None + else: + st.error(f"Database initialization error: {e}") + return None, None + + +def get_existing_descriptions(collection): + """Get existing descriptions from database.""" + try: + all_items = collection.get(include=["metadatas"]) + existing = {meta['video_filename']: True for meta in all_items['metadatas']} + return existing + except: + return {} + + +# Main tabs +tab1, tab2, tab3, tab4 = st.tabs(["🎬 Process Videos", "🔍 Search Videos", "📊 Architecture", "ℹ️ About"]) + +with tab1: + st.header("Process Videos and Build Knowledge Base") + + col1, col2, col3 = st.columns(3) + with col1: + st.markdown('

🤖 AI Model

Vision-Language Models

', unsafe_allow_html=True) + with col2: + st.markdown('

💾 Storage

ChromaDB Vector Store

', unsafe_allow_html=True) + with col3: + st.markdown('

🔍 Search

Semantic Similarity

', unsafe_allow_html=True) + + st.markdown("---") + + if st.button("🚀 Start Processing Videos", type="primary", use_container_width=True): + with st.spinner("Initializing AI models..."): + collection, embedding_model = initialize_database() + + if collection is None: + st.error("Failed to initialize database") + st.stop() + + st.session_state.collection = collection + st.session_state.embedding_model = embedding_model + + with st.spinner("Scanning for video files..."): + video_files = get_video_paths(dataset_folder, max_videos) + + if not video_files: + st.error(f"❌ No video files found in '{os.path.abspath(dataset_folder)}'") + st.info("💡 Supported: .mp4, .avi, .mov, .mkv, .flv, .wmv") + st.stop() + + st.session_state.video_files = video_files + st.success(f"✅ Found {len(video_files)} videos") + + existing = get_existing_descriptions(collection) + st.info(f"📚 Database contains {len(existing)} existing descriptions") + + progress_bar = st.progress(0) + status_text = st.empty() + + processed = 0 + skipped = 0 + + for idx, video_file in enumerate(video_files): + video_filename = os.path.basename(video_file) + progress = (idx + 1) / len(video_files) + progress_bar.progress(progress) + status_text.text(f"Processing {idx + 1}/{len(video_files)}: {video_filename}") + + if video_filename in existing: + skipped += 1 + continue + + try: + description = generate_video_description_ollama(video_file, selected_model, max_tokens, temperature) + embedding = embedding_model.encode(description).tolist() + + collection.add( + embeddings=[embedding], + documents=[description], + metadatas=[{"video_filename": video_filename}], + ids=[video_file] + ) + + processed += 1 + + except Exception as e: + st.warning(f"Error processing {video_filename}: {e}") + + progress_bar.progress(1.0) + status_text.empty() + + st.success(f"✅ Processing Complete!") + col1, col2, col3 = st.columns(3) + col1.metric("Processed", processed, delta=processed) + col2.metric("Skipped", skipped) + col3.metric("Total 
in Database", collection.count()) + + st.session_state.database_loaded = True + st.balloons() + +with tab2: + st.header("Semantic Video Search") + + col1, col2, col3 = st.columns(3) + with col1: + st.markdown('

🔍 AI-Powered

Semantic Understanding

', unsafe_allow_html=True) + with col2: + st.markdown('

⚡ Lightning Fast

Vector Search

', unsafe_allow_html=True) + with col3: + st.markdown('

🎯 Accurate Results

Ranked by Relevance

', unsafe_allow_html=True) + + st.markdown("---") + + if not st.session_state.database_loaded: + if os.path.exists(DATABASE_PATH): + with st.spinner("Loading knowledge base..."): + collection, embedding_model = initialize_database() + if collection: + st.session_state.collection = collection + st.session_state.embedding_model = embedding_model + st.session_state.database_loaded = True + st.success(f"✅ Loaded {collection.count()} video descriptions") + + if not st.session_state.database_loaded: + st.warning("⚠️ Please process videos first") + else: + with st.expander("📋 View All Video Descriptions", expanded=False): + try: + collection = st.session_state.collection + all_data = collection.get(include=["documents", "metadatas"]) + + st.info(f"📊 Total videos: {len(all_data['documents'])}") + + for i, (doc, metadata) in enumerate(zip(all_data['documents'], all_data['metadatas'])): + st.markdown(f"**{i+1}. {metadata['video_filename']}**") + st.text(doc) + if i < len(all_data['documents']) - 1: + st.markdown("---") + except Exception as e: + st.error(f"Error loading descriptions: {e}") + + st.markdown("### 🔍 Enter Your Search Query") + query = st.text_input("", placeholder="e.g., person playing basketball, sunset over ocean, dog running in park", label_visibility="collapsed") + + col1, col2 = st.columns([3, 1]) + with col1: + st.caption("💡 Try: 'person', 'animal', 'outdoor scene', 'sports activity', or keywords from descriptions above") + with col2: + search_button = st.button("🔍 Search", type="primary", use_container_width=True) + + if search_button and query: + with st.spinner("Searching with AI..."): + try: + collection = st.session_state.collection + embedding_model = st.session_state.embedding_model + + query_embedding = embedding_model.encode(query).tolist() + + results = collection.query( + query_embeddings=[query_embedding], + n_results=3, + include=["documents", "metadatas", "distances"] + ) + + st.success("✅ Search Complete!") + st.balloons() + 
st.markdown(f"**Query:** *{query}*") + st.markdown("---") + + for i, (doc, metadata, distance) in enumerate(zip( + results['documents'][0], + results['metadatas'][0], + results['distances'][0] + )): + similarity_score = 1 - distance + video_path = results['ids'][0][i] + + if similarity_score > 0.7: + score_emoji = "🟢" + score_label = "Excellent Match" + elif similarity_score > 0.5: + score_emoji = "🟡" + score_label = "Good Match" + else: + score_emoji = "🟠" + score_label = "Moderate Match" + + with st.expander(f"{score_emoji} Result {i+1}: {metadata['video_filename']} - {score_label} ({similarity_score:.2%})", expanded=(i==0)): + col1, col2 = st.columns([3, 2]) + + with col1: + st.markdown("#### 📝 Video Description") + st.info(doc) + st.markdown("#### 📊 Similarity Metrics") + st.progress(similarity_score) + st.caption(f"Similarity Score: {similarity_score:.2%} | Distance: {distance:.3f}") + + with col2: + if os.path.exists(video_path): + st.markdown("#### 🎬 Video Preview") + st.video(video_path) + else: + st.warning("Video file not found") + + except Exception as e: + st.error(f"Search error: {e}") + +with tab3: + st.header("System Architecture") + + st.markdown(""" + ### Video RAG Pipeline + + This system demonstrates semantic video search using vision-language models and vector embeddings. 
+ """) + + st.markdown("### 🔄 System Architecture Flow") + + st.info("**Video Processing Pipeline** - How videos are converted to searchable descriptions") + + cols = st.columns(7) + with cols[0]: + st.markdown("### 📹\n**Video Files**\nInput videos") + with cols[1]: + st.markdown("### ➡️") + with cols[2]: + st.markdown("### 🎞️\n**Extract Frame**\nOpenCV") + with cols[3]: + st.markdown("### ➡️") + with cols[4]: + st.markdown("### 🤖\n**Ollama Vision**\nModel inference") + with cols[5]: + st.markdown("### ➡️") + with cols[6]: + st.markdown("### 📝\n**Description**\nText output") + + st.markdown("") + + cols2 = st.columns(5) + with cols2[0]: + st.markdown("### 📝\n**Description**") + with cols2[1]: + st.markdown("### ➡️") + with cols2[2]: + st.markdown("### 🔢\n**Embeddings**\nTransformers") + with cols2[3]: + st.markdown("### ➡️") + with cols2[4]: + st.markdown("### 💾\n**ChromaDB**\nVector store") + + st.markdown("---") + + st.info("**Search Pipeline** - How queries find relevant videos") + + cols3 = st.columns(7) + with cols3[0]: + st.markdown("### 👤\n**User Query**\nNatural text") + with cols3[1]: + st.markdown("### ➡️") + with cols3[2]: + st.markdown("### 🔢\n**Embedding**\nVector form") + with cols3[3]: + st.markdown("### ➡️") + with cols3[4]: + st.markdown("### 🔍\n**Similarity**\nCosine dist") + with cols3[5]: + st.markdown("### ➡️") + with cols3[6]: + st.markdown("### 🎬\n**Results**\nMatched videos") + + st.markdown("---") + + col1, col2 = st.columns(2) + + with col1: + st.markdown("### 🎯 Key Components") + st.markdown(""" + **1. Video Processing** + - Frame extraction with OpenCV + - Vision model inference + - Description generation + + **2. Embedding Generation** + - Sentence Transformers + - 384-dimensional vectors + - Semantic representation + + **3. 
Vector Storage** + - ChromaDB persistent storage + - Cosine similarity metric + - Efficient retrieval + """) + + with col2: + st.markdown("### 🚀 Features") + st.markdown(""" + **Performance** + - Fast inference times + - Efficient memory usage + - Local processing + + **Capabilities** + - Natural language search + - Semantic understanding + - Multi-modal analysis + + **Integration** + - Ollama runtime + - Easy model management + - Production-ready + """) + + st.markdown("---") + + st.markdown("### 🔧 Technical Stack") + + col1, col2, col3 = st.columns(3) + + with col1: + st.markdown(""" + **AI Models** + - Qwen Vision-Language + - Llama Vision + - MiniLM Embeddings + """) + + with col2: + st.markdown(""" + **Infrastructure** + - Ollama Runtime + - ChromaDB + - Streamlit UI + """) + + with col3: + st.markdown(""" + **Processing** + - OpenCV + - Sentence Transformers + - Python Backend + """) + +with tab4: + st.header("About This Demo") + + st.markdown(""" + ### 🎯 Video RAG with Ollama + + This application demonstrates **semantic video search** powered by **Ollama**. + It combines vision-language models, vector embeddings, and similarity search to enable + natural language queries over video content. + + ### 💡 Use Cases + + - **Video Libraries**: Quickly find specific content in large video collections + - **Content Management**: Search videos by describing what you're looking for + - **Surveillance**: Locate specific events or activities in footage + - **Education**: Find relevant video segments for learning materials + - **Media Production**: Search stock footage by description + + ### 🏗️ How It Works + + 1. **Extract**: Take representative frames from videos + 2. **Describe**: Use AI vision models to generate detailed descriptions + 3. **Embed**: Convert descriptions to semantic vectors + 4. **Store**: Save vectors in a searchable database + 5. **Query**: Search using natural language + 6. 
**Retrieve**: Find most similar videos by semantic meaning + """) + + st.markdown("---") + + st.markdown("### 🛠️ Technology Stack") + + st.code(""" + # Core Technologies + - Ollama: Local LLM runtime + - Vision-Language Models: Qwen, Llama, etc. + - ChromaDB: Efficient vector database + - Sentence Transformers: Text embedding generation + - Streamlit: Interactive web interface + - OpenCV: Video frame extraction + """, language="python") + + st.markdown("---") + + st.markdown("### 📡 System Status") + + col1, col2, col3 = st.columns(3) + + with col1: + try: + ollama.list() + st.success("✅ Ollama Connected") + except: + st.error("❌ Ollama Offline") + + with col2: + if os.path.exists(DATABASE_PATH): + st.success(f"✅ Database Active") + else: + st.info("💾 Database Not Created") + + with col3: + if st.session_state.database_loaded: + st.success(f"✅ {st.session_state.collection.count()} Videos Indexed") + else: + st.info("⏳ Awaiting Processing") + +# Footer +st.markdown("---") +st.markdown( + '
' + '

🎥 Video RAG Demo | Powered by Ollama

' + '
', + unsafe_allow_html=True +) diff --git a/Video-Description-Generation-Query-Retrieval/uv.lock b/Video-Description-Generation-Query-Retrieval/uv.lock index 822c84a..8dde654 100644 --- a/Video-Description-Generation-Query-Retrieval/uv.lock +++ b/Video-Description-Generation-Query-Retrieval/uv.lock @@ -1,13 +1,25 @@ version = 1 -revision = 2 +revision = 3 requires-python = ">=3.12.0" resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", - "python_full_version >= '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", - "python_full_version < '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", + "python_full_version >= '3.13'", + "python_full_version < '3.13'", +] + +[[package]] +name = "altair" +version = "5.5.0" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "jinja2" }, + { name = "jsonschema" }, + { name = "narwhals" }, + { name = "packaging" }, + { name = "typing-extensions", marker = "python_full_version < '3.14'" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/16/b1/f2969c7bdb8ad8bbdda031687defdce2c19afba2aa2c8e1d2a17f78376d8/altair-5.5.0.tar.gz", hash = "sha256:d960ebe6178c56de3855a68c47b516be38640b73fb3b5111c2a9ca90546dd73d", size = 705305, upload-time = "2024-11-23T23:39:58.542Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/aa/f3/0b6ced594e51cc95d8c1fc1640d3623770d01e4969d29c0bd09945fafefa/altair-5.5.0-py3-none-any.whl", hash = "sha256:91a310b926508d560fe0148d02a194f38b824122641ef528113d029fcd129f8c", size = 731200, upload-time = "2024-11-23T23:39:56.4Z" }, ] [[package]] @@ -115,32 +127,6 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/77/06/bb80f5f86020c4551da315d78b3ab75e8228f89f0162f2c3a819e407941a/attrs-25.3.0-py3-none-any.whl", hash 
= "sha256:427318ce031701fea540783410126f03899a97ffc6f61596ad581ac2e40e3bc3", size = 63815, upload-time = "2025-03-13T11:10:21.14Z" }, ] -[[package]] -name = "av" -version = "14.4.0" -source = { registry = "https://pypi.org/simple" } -sdist = { url = "https://files.pythonhosted.org/packages/86/f6/0b473dab52dfdea05f28f3578b1c56b6c796ce85e76951bab7c4e38d5a74/av-14.4.0.tar.gz", hash = "sha256:3ecbf803a7fdf67229c0edada0830d6bfaea4d10bfb24f0c3f4e607cd1064b42", size = 3892203, upload-time = "2025-05-16T19:13:35.737Z" } -wheels = [ - { url = "https://files.pythonhosted.org/packages/a6/75/b8641653780336c90ba89e5352cac0afa6256a86a150c7703c0b38851c6d/av-14.4.0-cp312-cp312-macosx_12_0_arm64.whl", hash = "sha256:a53e682b239dd23b4e3bc9568cfb1168fc629ab01925fdb2e7556eb426339e94", size = 19954125, upload-time = "2025-05-16T19:09:54.909Z" }, - { url = "https://files.pythonhosted.org/packages/99/e6/37fe6fa5853a48d54d749526365780a63a4bc530be6abf2115e3a21e292a/av-14.4.0-cp312-cp312-macosx_12_0_x86_64.whl", hash = "sha256:5aa0b901751a32703fa938d2155d56ce3faf3630e4a48d238b35d2f7e49e5395", size = 23751479, upload-time = "2025-05-16T19:09:57.113Z" }, - { url = "https://files.pythonhosted.org/packages/f7/75/9a5f0e6bda5f513b62bafd1cff2b495441a8b07ab7fb7b8e62f0c0d1683f/av-14.4.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:a3b316fed3597675fe2aacfed34e25fc9d5bb0196dc8c0b014ae5ed4adda48de", size = 33801401, upload-time = "2025-05-16T19:09:59.479Z" }, - { url = "https://files.pythonhosted.org/packages/6a/c9/e4df32a2ad1cb7f3a112d0ed610c5e43c89da80b63c60d60e3dc23793ec0/av-14.4.0-cp312-cp312-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:a587b5c5014c3c0e16143a0f8d99874e46b5d0c50db6111aa0b54206b5687c81", size = 32364330, upload-time = "2025-05-16T19:10:02.111Z" }, - { url = "https://files.pythonhosted.org/packages/ca/f0/64e7444a41817fde49a07d0239c033f7e9280bec4a4bb4784f5c79af95e6/av-14.4.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", 
hash = "sha256:10d53f75e8ac1ec8877a551c0db32a83c0aaeae719d05285281eaaba211bbc30", size = 35519508, upload-time = "2025-05-16T19:10:05.008Z" }, - { url = "https://files.pythonhosted.org/packages/c2/a8/a370099daa9033a3b6f9b9bd815304b3d8396907a14d09845f27467ba138/av-14.4.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:c8558cfde79dd8fc92d97c70e0f0fa8c94c7a66f68ae73afdf58598f0fe5e10d", size = 36448593, upload-time = "2025-05-16T19:10:07.887Z" }, - { url = "https://files.pythonhosted.org/packages/27/bb/edb6ceff8fa7259cb6330c51dbfbc98dd1912bd6eb5f7bc05a4bb14a9d6e/av-14.4.0-cp312-cp312-musllinux_1_2_i686.whl", hash = "sha256:455b6410dea0ab2d30234ffb28df7d62ca3cdf10708528e247bec3a4cdcced09", size = 34701485, upload-time = "2025-05-16T19:10:10.886Z" }, - { url = "https://files.pythonhosted.org/packages/a7/8a/957da1f581aa1faa9a5dfa8b47ca955edb47f2b76b949950933b457bfa1d/av-14.4.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:1661efbe9d975f927b8512d654704223d936f39016fad2ddab00aee7c40f412c", size = 37521981, upload-time = "2025-05-16T19:10:13.678Z" }, - { url = "https://files.pythonhosted.org/packages/28/76/3f1cf0568592f100fd68eb40ed8c491ce95ca3c1378cc2d4c1f6d1bd295d/av-14.4.0-cp312-cp312-win_amd64.whl", hash = "sha256:fbbeef1f421a3461086853d6464ad5526b56ffe8ccb0ab3fd0a1f121dfbf26ad", size = 27925944, upload-time = "2025-05-16T19:10:16.485Z" }, - { url = "https://files.pythonhosted.org/packages/12/4c/b0205f77352312ff457ecdf31723dbf4403b7a03fc1659075d6d32f23ef7/av-14.4.0-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:3d2aea7c602b105363903e4017103bc4b60336e7aff80e1c22e8b4ec09fd125f", size = 19917341, upload-time = "2025-05-16T19:10:18.826Z" }, - { url = "https://files.pythonhosted.org/packages/e1/c4/9e783bd7d47828e9c67f9c773c99de45c5ae01b3e942f1abf6cbaf530267/av-14.4.0-cp313-cp313-macosx_12_0_x86_64.whl", hash = "sha256:38c18f036aeb6dc9abf5e867d998c867f9ec93a5f722b60721fdffc123bbb2ae", size = 23715363, upload-time = "2025-05-16T19:10:21.42Z" }, - { url = 
"https://files.pythonhosted.org/packages/b5/26/b2b406a676864d06b1c591205782d8527e7c99e5bc51a09862c3576e0087/av-14.4.0-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:58c1e18c8be73b6eada2d9ec397852ec74ebe51938451bdf83644a807189d6c8", size = 33496968, upload-time = "2025-05-16T19:10:24.178Z" }, - { url = "https://files.pythonhosted.org/packages/89/09/0a032bbe30c7049fca243ec8cf01f4be49dd6e7f7b9c3c7f0cc13f83c9d3/av-14.4.0-cp313-cp313-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:e4c32ff03a357feb030634f093089a73cb474b04efe7fbfba31f229cb2fab115", size = 32075498, upload-time = "2025-05-16T19:10:27.384Z" }, - { url = "https://files.pythonhosted.org/packages/0b/1f/0fee20f74c1f48086366e59dbd37fa0684cd0f3c782a65cbb719d26c7acd/av-14.4.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:af31d16ae25964a6a02e09cc132b9decd5ee493c5dcb21bcdf0d71b2d6adbd59", size = 35224910, upload-time = "2025-05-16T19:10:30.104Z" }, - { url = "https://files.pythonhosted.org/packages/9e/19/1c4a201c75a2a431a85a43fd15d1fad55a28c22d596461d861c8d70f9b92/av-14.4.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:e9fb297009e528f4851d25f3bb2781b2db18b59b10aed10240e947b77c582fb7", size = 36172918, upload-time = "2025-05-16T19:10:32.789Z" }, - { url = "https://files.pythonhosted.org/packages/00/48/26b7e5d911c807f5f017a285362470ba16f44e8ea46f8b09ab5e348dd15b/av-14.4.0-cp313-cp313-musllinux_1_2_i686.whl", hash = "sha256:573314cb9eafec2827dc98c416c965330dc7508193adbccd281700d8673b9f0a", size = 34414492, upload-time = "2025-05-16T19:10:36.023Z" }, - { url = "https://files.pythonhosted.org/packages/6d/26/2f4badfa5b5b7b8f5f83d562b143a83ed940fa458eea4cad495ce95c9741/av-14.4.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:f82ab27ee57c3b80eb50a5293222307dfdc02f810ea41119078cfc85ea3cf9a8", size = 37245826, upload-time = "2025-05-16T19:10:39.562Z" }, - { url = 
"https://files.pythonhosted.org/packages/f4/02/88dbb6f5a05998b730d2e695b05060297af127ac4250efbe0739daa446d5/av-14.4.0-cp313-cp313-win_amd64.whl", hash = "sha256:9f682003bbcaac620b52f68ff0e85830fff165dea53949e217483a615993ca20", size = 27898395, upload-time = "2025-05-16T19:13:02.653Z" }, -] - [[package]] name = "babel" version = "2.17.0" @@ -239,12 +225,21 @@ css = [ { name = "tinycss2" }, ] +[[package]] +name = "blinker" +version = "1.9.0" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/21/28/9b3f50ce0e048515135495f198351908d99540d69bfdc8c1d15b73dc55ce/blinker-1.9.0.tar.gz", hash = "sha256:b4ce2265a7abece45e7cc896e98dbebe6cead56bcf805a3d23136d145f5445bf", size = 22460, upload-time = "2024-11-08T17:25:47.436Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/10/cb/f2ad4230dc2eb1a74edf38f1a38b9b52277f75bef262d8908e60d957e13c/blinker-1.9.0-py3-none-any.whl", hash = "sha256:ba0efaa9080b619ff2f3459d1d500c57bddea4a6b424b60a91141db6fd2f08bc", size = 8458, upload-time = "2024-11-08T17:25:46.184Z" }, +] + [[package]] name = "build" version = "1.2.2.post1" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "colorama", marker = "os_name == 'nt' and sys_platform != 'linux'" }, + { name = "colorama", marker = "os_name == 'nt'" }, { name = "packaging" }, { name = "pyproject-hooks" }, ] @@ -452,18 +447,6 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/4e/8c/f3147f5c4b73e7550fe5f9352eaa956ae838d5c51eb58e7a25b9f3e2643b/decorator-5.2.1-py3-none-any.whl", hash = "sha256:d316bb415a2d9e2d2b3abcc4084c6502fc09240e292cd76a76afc106a1c8e04a", size = 9190, upload-time = "2025-02-24T04:41:32.565Z" }, ] -[[package]] -name = "decord" -version = "0.6.0" -source = { registry = "https://pypi.org/simple" } -dependencies = [ - { name = "numpy" }, -] -wheels = [ - { url = 
"https://files.pythonhosted.org/packages/11/79/936af42edf90a7bd4e41a6cac89c913d4b47fa48a26b042d5129a9242ee3/decord-0.6.0-py3-none-manylinux2010_x86_64.whl", hash = "sha256:51997f20be8958e23b7c4061ba45d0efcd86bffd5fe81c695d0befee0d442976", size = 13602299, upload-time = "2021-06-14T21:30:55.486Z" }, - { url = "https://files.pythonhosted.org/packages/6c/be/e15b5b866da452e62635a7b27513f31cb581fa2ea9cc9b768b535d62a955/decord-0.6.0-py3-none-win_amd64.whl", hash = "sha256:02665d7c4f1193a330205a791bc128f7e108eb6ae5b67144437a02f700943bad", size = 24733380, upload-time = "2021-06-14T21:30:57.766Z" }, -] - [[package]] name = "defusedxml" version = "0.7.1" @@ -557,6 +540,30 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/bb/61/78c7b3851add1481b048b5fdc29067397a1784e2910592bc81bb3f608635/fsspec-2025.5.1-py3-none-any.whl", hash = "sha256:24d3a2e663d5fc735ab256263c4075f374a174c3410c0b25e5bd1970bceaa462", size = 199052, upload-time = "2025-05-24T12:03:21.66Z" }, ] +[[package]] +name = "gitdb" +version = "4.0.12" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "smmap" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/72/94/63b0fc47eb32792c7ba1fe1b694daec9a63620db1e313033d18140c2320a/gitdb-4.0.12.tar.gz", hash = "sha256:5ef71f855d191a3326fcfbc0d5da835f26b13fbcba60c32c21091c349ffdb571", size = 394684, upload-time = "2025-01-02T07:20:46.413Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/a0/61/5c78b91c3143ed5c14207f463aecfc8f9dbb5092fb2869baf37c273b2705/gitdb-4.0.12-py3-none-any.whl", hash = "sha256:67073e15955400952c6565cc3e707c554a4eea2e428946f7a4c162fab9bd9bcf", size = 62794, upload-time = "2025-01-02T07:20:43.624Z" }, +] + +[[package]] +name = "gitpython" +version = "3.1.45" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "gitdb" }, +] +sdist = { url = 
"https://files.pythonhosted.org/packages/9a/c8/dd58967d119baab745caec2f9d853297cec1989ec1d63f677d3880632b88/gitpython-3.1.45.tar.gz", hash = "sha256:85b0ee964ceddf211c41b9f27a49086010a190fd8132a24e21f362a4b36a791c", size = 215076, upload-time = "2025-07-24T03:45:54.871Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/01/61/d4b89fec821f72385526e1b9d9a3a0385dda4a72b206d28049e2c7cd39b8/gitpython-3.1.45-py3-none-any.whl", hash = "sha256:8908cb2e02fb3b93b7eb0f2827125cb699869470432cc885f019b8fd0fccff77", size = 208168, upload-time = "2025-07-24T03:45:52.517Z" }, +] + [[package]] name = "google-auth" version = "2.40.2" @@ -704,11 +711,6 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/d0/fb/5307bd3612eb0f0e62c3a916ae531d3a31e58fb5c82b58e3ebf7fd6f47a1/huggingface_hub-0.33.1-py3-none-any.whl", hash = "sha256:ec8d7444628210c0ba27e968e3c4c973032d44dcea59ca0d78ef3f612196f095", size = 515377, upload-time = "2025-06-25T12:02:55.611Z" }, ] -[package.optional-dependencies] -hf-xet = [ - { name = "hf-xet" }, -] - [[package]] name = "humanfriendly" version = "10.0" @@ -751,127 +753,6 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/a4/ed/1f1afb2e9e7f38a545d628f864d562a5ae64fe6f7a10e28ffb9b185b4e89/importlib_resources-6.5.2-py3-none-any.whl", hash = "sha256:789cfdc3ed28c78b67a06acb8126751ced69a3d5f79c095a98298cd8a760ccec", size = 37461, upload-time = "2025-01-03T18:51:54.306Z" }, ] -[[package]] -name = "intel-cmplr-lib-rt" -version = "2025.0.4" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/c2/80/2a10995012a5d80cca2d8cac5d3a763116f1d57c272ee4f07ca94ba63a1a/intel_cmplr_lib_rt-2025.0.4-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:440cf7cad2ed16f6a0a4589b03447b2d4fdae4f630ea26a4510e1cf5b40b1f1d", size = 45884211, 
upload-time = "2024-12-12T12:02:44.312Z" }, -] - -[[package]] -name = "intel-cmplr-lib-rt" -version = "2025.0.5" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/1b/16/85f1f3c1ab200d369b9774b1b6121d2790c8b8647a135882106bcd3aadf9/intel_cmplr_lib_rt-2025.0.5-py2.py3-none-win_amd64.whl", hash = "sha256:928395dc2dc6e423439ff72e52cd02fc5e79686d5b14ce20f58461d8ed7d950a", size = 17271117, upload-time = "2025-02-11T10:59:27.047Z" }, -] - -[[package]] -name = "intel-cmplr-lib-ur" -version = "2025.0.4" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", -] -dependencies = [ - { name = "umf", marker = "sys_platform == 'linux'" }, -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/ae/d0/0d376a3eb3d5f8d0c0dd828a9f889e485d8ded1f7d501976c72916826cef/intel_cmplr_lib_ur-2025.0.4-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:d36d586721f0cb87b051aca1bf3f653ccee7960f15efb0132e5482d95c5b2c9b", size = 25158275, upload-time = "2024-12-12T12:03:36.653Z" }, -] - -[[package]] -name = "intel-cmplr-lib-ur" -version = "2025.0.5" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] -dependencies = [ - { name = "umf", marker = "sys_platform == 'win32'" }, -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/1e/c1/23e258d315f4b39cd923236e6eba90d25f936968be7a0bdfc46b079cef25/intel_cmplr_lib_ur-2025.0.5-py2.py3-none-win_amd64.whl", hash = "sha256:d792c1cafada93aee1ab387e85ecd906a6bb0c0fc5d5fb9b2986c1dcaf301aae", size = 1163425, upload-time = 
"2025-02-11T10:59:31.57Z" }, -] - -[[package]] -name = "intel-cmplr-lic-rt" -version = "2025.0.4" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/c3/18/77cc45b2e48f35c126f478116b65cad1025cd89ab58038a93fc2ce03a6e9/intel_cmplr_lic_rt-2025.0.4-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:943d03ef2028cdb33140c84bad35b45d02186617ac0cd15849d179764132408a", size = 18913, upload-time = "2024-12-12T12:02:36.833Z" }, -] - -[[package]] -name = "intel-cmplr-lic-rt" -version = "2025.0.5" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/83/b9/7ac88e49a14026446953c0d2cdf32198b043a10f0b43ad02e36c7b273501/intel_cmplr_lic_rt-2025.0.5-py2.py3-none-win_amd64.whl", hash = "sha256:2a37b5be844790664b7bf67aef33058103368face8ce1ff72643d6e2ffc3efbf", size = 49547, upload-time = "2025-02-11T10:59:46.543Z" }, -] - -[[package]] -name = "intel-pti" -version = "0.10.1" -source = { registry = "https://pypi.org/simple" } -wheels = [ - { url = "https://files.pythonhosted.org/packages/f0/f2/313e46be14a27d4fb6eaab683a0c7589b0227549e2bf596fa6ccc0df8f8f/intel_pti-0.10.1-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:7e12361e8ac18996258c9d7f9ee831372c1c1c85028fa8502fb257e1dadf1de2", size = 678688, upload-time = "2025-02-20T11:29:43.507Z" }, - { url = "https://files.pythonhosted.org/packages/da/49/ac4c5413ae249cc79c0f04d926942a2802d3e5b6186d4bfe67db841f53f9/intel_pti-0.10.1-py2.py3-none-win_amd64.whl", hash = "sha256:bf9418aff05dd6807f3130eaae874ab2c5f79bcbfa1eaae7ba9b5c8ff8290038", size = 437518, upload-time = "2025-02-20T11:29:40.533Z" }, -] - -[[package]] 
-name = "intel-sycl-rt" -version = "2025.0.4" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", -] -dependencies = [ - { name = "intel-cmplr-lib-rt", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-cmplr-lib-ur", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-cmplr-lic-rt", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/78/2b/3b99709cf8dd3304d05b853797a6fa962394ccf520536dc8e5eb9d3d9b1f/intel_sycl_rt-2025.0.4-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:85c5fd6029f62e8361af1d9ddb0f6c6f9cf4912bbe9ad684f89e9e5842128879", size = 12356130, upload-time = "2024-12-12T12:03:18.87Z" }, -] - -[[package]] -name = "intel-sycl-rt" -version = "2025.0.5" -source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] -dependencies = [ - { name = "intel-cmplr-lib-rt", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "intel-cmplr-lib-ur", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "intel-cmplr-lic-rt", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/0c/11/46cb85d052bf13153f2cb3994dbfda6116a06bff55d209d04b3f424d94d6/intel_sycl_rt-2025.0.5-py2.py3-none-win_amd64.whl", hash = 
"sha256:10a322b5bb9a180cbeea45fe2c8603bff55f4dedf6302fff7f66dafc191ff580", size = 10786985, upload-time = "2025-02-11T10:59:35.055Z" }, -] - [[package]] name = "ipykernel" version = "6.29.5" @@ -1161,7 +1042,7 @@ dependencies = [ { name = "overrides" }, { name = "packaging" }, { name = "prometheus-client" }, - { name = "pywinpty", marker = "os_name == 'nt' and sys_platform != 'linux'" }, + { name = "pywinpty", marker = "os_name == 'nt'" }, { name = "pyzmq" }, { name = "send2trash" }, { name = "terminado" }, @@ -1179,7 +1060,7 @@ name = "jupyter-server-terminals" version = "0.5.3" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "pywinpty", marker = "os_name == 'nt' and sys_platform != 'linux'" }, + { name = "pywinpty", marker = "os_name == 'nt'" }, { name = "terminado" }, ] sdist = { url = "https://files.pythonhosted.org/packages/fc/d5/562469734f476159e99a55426d697cbf8e7eb5efe89fb0e0b4f83a3d3459/jupyter_server_terminals-0.5.3.tar.gz", hash = "sha256:5ae0295167220e9ace0edcfdb212afd2b01ee8d179fe6f23c899590e9b8a5269", size = 31430, upload-time = "2024-03-12T14:37:03.049Z" } @@ -1398,6 +1279,15 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/43/e3/7d92a15f894aa0c9c4b49b8ee9ac9850d6e63b03c9c32c0367a13ae62209/mpmath-1.3.0-py3-none-any.whl", hash = "sha256:a0b2b9fe80bbcd81a6647ff13108738cfb482d481d826cc0e02f5b35e5c88d2c", size = 536198, upload-time = "2023-03-07T16:47:09.197Z" }, ] +[[package]] +name = "narwhals" +version = "2.12.0" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/93/f8/e1c28f24b641871c14ccae7ba6381f3c7827789a06e947ce975ae8a9075a/narwhals-2.12.0.tar.gz", hash = "sha256:075b6d56f3a222613793e025744b129439ecdff9292ea6615dd983af7ba6ea44", size = 590404, upload-time = "2025-11-17T10:53:28.381Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/0b/9a/c6f79de7ba3a0a8473129936b7b90aa461d3d46fec6f1627672b1dccf4e9/narwhals-2.12.0-py3-none-any.whl", 
hash = "sha256:baeba5d448a30b04c299a696bd9ee5ff73e4742143e06c49ca316b46539a7cbb", size = 425014, upload-time = "2025-11-17T10:53:26.65Z" }, +] + [[package]] name = "nbclient" version = "0.10.2" @@ -1537,6 +1427,139 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/67/0e/35082d13c09c02c011cf21570543d202ad929d961c02a147493cb0c2bdf5/numpy-2.2.6-cp313-cp313t-win_amd64.whl", hash = "sha256:6031dd6dfecc0cf9f668681a37648373bddd6421fff6c66ec1624eed0180ee06", size = 12771374, upload-time = "2025-05-17T21:43:35.479Z" }, ] +[[package]] +name = "nvidia-cublas-cu12" +version = "12.6.4.1" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/af/eb/ff4b8c503fa1f1796679dce648854d58751982426e4e4b37d6fce49d259c/nvidia_cublas_cu12-12.6.4.1-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:08ed2686e9875d01b58e3cb379c6896df8e76c75e0d4a7f7dace3d7b6d9ef8eb", size = 393138322, upload-time = "2024-11-20T17:40:25.65Z" }, +] + +[[package]] +name = "nvidia-cuda-cupti-cu12" +version = "12.6.80" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/49/60/7b6497946d74bcf1de852a21824d63baad12cd417db4195fc1bfe59db953/nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:6768bad6cab4f19e8292125e5f1ac8aa7d1718704012a0e3272a6f61c4bce132", size = 8917980, upload-time = "2024-11-20T17:36:04.019Z" }, + { url = "https://files.pythonhosted.org/packages/a5/24/120ee57b218d9952c379d1e026c4479c9ece9997a4fb46303611ee48f038/nvidia_cuda_cupti_cu12-12.6.80-py3-none-manylinux2014_x86_64.whl", hash = "sha256:a3eff6cdfcc6a4c35db968a06fcadb061cbc7d6dde548609a941ff8701b98b73", size = 8917972, upload-time = "2024-10-01T16:58:06.036Z" }, +] + +[[package]] +name = "nvidia-cuda-nvrtc-cu12" +version = "12.6.77" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = 
"https://files.pythonhosted.org/packages/75/2e/46030320b5a80661e88039f59060d1790298b4718944a65a7f2aeda3d9e9/nvidia_cuda_nvrtc_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:35b0cc6ee3a9636d5409133e79273ce1f3fd087abb0532d2d2e8fff1fe9efc53", size = 23650380, upload-time = "2024-10-01T17:00:14.643Z" }, +] + +[[package]] +name = "nvidia-cuda-runtime-cu12" +version = "12.6.77" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/e1/23/e717c5ac26d26cf39a27fbc076240fad2e3b817e5889d671b67f4f9f49c5/nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:ba3b56a4f896141e25e19ab287cd71e52a6a0f4b29d0d31609f60e3b4d5219b7", size = 897690, upload-time = "2024-11-20T17:35:30.697Z" }, + { url = "https://files.pythonhosted.org/packages/f0/62/65c05e161eeddbafeca24dc461f47de550d9fa8a7e04eb213e32b55cfd99/nvidia_cuda_runtime_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:a84d15d5e1da416dd4774cb42edf5e954a3e60cc945698dc1d5be02321c44dc8", size = 897678, upload-time = "2024-10-01T16:57:33.821Z" }, +] + +[[package]] +name = "nvidia-cudnn-cu12" +version = "9.5.1.17" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "nvidia-cublas-cu12" }, +] +wheels = [ + { url = "https://files.pythonhosted.org/packages/2a/78/4535c9c7f859a64781e43c969a3a7e84c54634e319a996d43ef32ce46f83/nvidia_cudnn_cu12-9.5.1.17-py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:30ac3869f6db17d170e0e556dd6cc5eee02647abc31ca856634d5a40f82c15b2", size = 570988386, upload-time = "2024-10-25T19:54:26.39Z" }, +] + +[[package]] +name = "nvidia-cufft-cu12" +version = "11.3.0.4" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "nvidia-nvjitlink-cu12" }, +] +wheels = [ + { url = 
"https://files.pythonhosted.org/packages/8f/16/73727675941ab8e6ffd86ca3a4b7b47065edcca7a997920b831f8147c99d/nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:ccba62eb9cef5559abd5e0d54ceed2d9934030f51163df018532142a8ec533e5", size = 200221632, upload-time = "2024-11-20T17:41:32.357Z" }, + { url = "https://files.pythonhosted.org/packages/60/de/99ec247a07ea40c969d904fc14f3a356b3e2a704121675b75c366b694ee1/nvidia_cufft_cu12-11.3.0.4-py3-none-manylinux2014_x86_64.whl", hash = "sha256:768160ac89f6f7b459bee747e8d175dbf53619cfe74b2a5636264163138013ca", size = 200221622, upload-time = "2024-10-01T17:03:58.79Z" }, +] + +[[package]] +name = "nvidia-cufile-cu12" +version = "1.11.1.6" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/b2/66/cc9876340ac68ae71b15c743ddb13f8b30d5244af344ec8322b449e35426/nvidia_cufile_cu12-1.11.1.6-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:cc23469d1c7e52ce6c1d55253273d32c565dd22068647f3aa59b3c6b005bf159", size = 1142103, upload-time = "2024-11-20T17:42:11.83Z" }, +] + +[[package]] +name = "nvidia-curand-cu12" +version = "10.3.7.77" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/73/1b/44a01c4e70933637c93e6e1a8063d1e998b50213a6b65ac5a9169c47e98e/nvidia_curand_cu12-10.3.7.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:a42cd1344297f70b9e39a1e4f467a4e1c10f1da54ff7a85c12197f6c652c8bdf", size = 56279010, upload-time = "2024-11-20T17:42:50.958Z" }, + { url = "https://files.pythonhosted.org/packages/4a/aa/2c7ff0b5ee02eaef890c0ce7d4f74bc30901871c5e45dee1ae6d0083cd80/nvidia_curand_cu12-10.3.7.77-py3-none-manylinux2014_x86_64.whl", hash = "sha256:99f1a32f1ac2bd134897fc7a203f779303261268a65762a623bf30cc9fe79117", size = 56279000, upload-time = "2024-10-01T17:04:45.274Z" }, +] + +[[package]] +name = "nvidia-cusolver-cu12" 
+version = "11.7.1.2" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "nvidia-cublas-cu12" }, + { name = "nvidia-cusparse-cu12" }, + { name = "nvidia-nvjitlink-cu12" }, +] +wheels = [ + { url = "https://files.pythonhosted.org/packages/f0/6e/c2cf12c9ff8b872e92b4a5740701e51ff17689c4d726fca91875b07f655d/nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:e9e49843a7707e42022babb9bcfa33c29857a93b88020c4e4434656a655b698c", size = 158229790, upload-time = "2024-11-20T17:43:43.211Z" }, + { url = "https://files.pythonhosted.org/packages/9f/81/baba53585da791d043c10084cf9553e074548408e04ae884cfe9193bd484/nvidia_cusolver_cu12-11.7.1.2-py3-none-manylinux2014_x86_64.whl", hash = "sha256:6cf28f17f64107a0c4d7802be5ff5537b2130bfc112f25d5a30df227058ca0e6", size = 158229780, upload-time = "2024-10-01T17:05:39.875Z" }, +] + +[[package]] +name = "nvidia-cusparse-cu12" +version = "12.5.4.2" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "nvidia-nvjitlink-cu12" }, +] +wheels = [ + { url = "https://files.pythonhosted.org/packages/06/1e/b8b7c2f4099a37b96af5c9bb158632ea9e5d9d27d7391d7eb8fc45236674/nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:7556d9eca156e18184b94947ade0fba5bb47d69cec46bf8660fd2c71a4b48b73", size = 216561367, upload-time = "2024-11-20T17:44:54.824Z" }, + { url = "https://files.pythonhosted.org/packages/43/ac/64c4316ba163e8217a99680c7605f779accffc6a4bcd0c778c12948d3707/nvidia_cusparse_cu12-12.5.4.2-py3-none-manylinux2014_x86_64.whl", hash = "sha256:23749a6571191a215cb74d1cdbff4a86e7b19f1200c071b3fcf844a5bea23a2f", size = 216561357, upload-time = "2024-10-01T17:06:29.861Z" }, +] + +[[package]] +name = "nvidia-cusparselt-cu12" +version = "0.6.3" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = 
"https://files.pythonhosted.org/packages/3b/9a/72ef35b399b0e183bc2e8f6f558036922d453c4d8237dab26c666a04244b/nvidia_cusparselt_cu12-0.6.3-py3-none-manylinux2014_x86_64.whl", hash = "sha256:e5c8a26c36445dd2e6812f1177978a24e2d37cacce7e090f297a688d1ec44f46", size = 156785796, upload-time = "2024-10-15T21:29:17.709Z" }, +] + +[[package]] +name = "nvidia-nccl-cu12" +version = "2.26.2" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/67/ca/f42388aed0fddd64ade7493dbba36e1f534d4e6fdbdd355c6a90030ae028/nvidia_nccl_cu12-2.26.2-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:694cf3879a206553cc9d7dbda76b13efaf610fdb70a50cba303de1b0d1530ac6", size = 201319755, upload-time = "2025-03-13T00:29:55.296Z" }, +] + +[[package]] +name = "nvidia-nvjitlink-cu12" +version = "12.6.85" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/9d/d7/c5383e47c7e9bf1c99d5bd2a8c935af2b6d705ad831a7ec5c97db4d82f4f/nvidia_nvjitlink_cu12-12.6.85-py3-none-manylinux2010_x86_64.manylinux_2_12_x86_64.whl", hash = "sha256:eedc36df9e88b682efe4309aa16b5b4e78c2407eac59e8c10a6a47535164369a", size = 19744971, upload-time = "2024-11-20T17:46:53.366Z" }, +] + +[[package]] +name = "nvidia-nvtx-cu12" +version = "12.6.77" +source = { registry = "https://pypi.org/simple" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/56/9a/fff8376f8e3d084cd1530e1ef7b879bb7d6d265620c95c1b322725c694f4/nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:b90bed3df379fa79afbd21be8e04a0314336b8ae16768b58f2d34cb1d04cd7d2", size = 89276, upload-time = "2024-11-20T17:38:27.621Z" }, + { url = "https://files.pythonhosted.org/packages/9e/4e/0d0c945463719429b7bd21dece907ad0bde437a2ff12b9b12fee94722ab0/nvidia_nvtx_cu12-12.6.77-py3-none-manylinux2014_x86_64.whl", hash = 
"sha256:6574241a3ec5fdc9334353ab8c479fe75841dbe8f4532a8fc97ce63503330ba1", size = 89265, upload-time = "2024-10-01T17:00:38.172Z" }, +] + [[package]] name = "oauthlib" version = "3.2.2" @@ -1546,6 +1569,19 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/7e/80/cab10959dc1faead58dc8384a781dfbf93cb4d33d50988f7a69f1b7c9bbe/oauthlib-3.2.2-py3-none-any.whl", hash = "sha256:8139f29aac13e25d502680e9e19963e83f16838d48a0d71c287fe40e7067fbca", size = 151688, upload-time = "2022-10-17T20:04:24.037Z" }, ] +[[package]] +name = "ollama" +version = "0.6.1" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "httpx" }, + { name = "pydantic" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/9d/5a/652dac4b7affc2b37b95386f8ae78f22808af09d720689e3d7a86b6ed98e/ollama-0.6.1.tar.gz", hash = "sha256:478c67546836430034b415ed64fa890fd3d1ff91781a9d548b3325274e69d7c6", size = 51620, upload-time = "2025-11-13T23:02:17.416Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/47/4f/4a617ee93d8208d2bcf26b2d8b9402ceaed03e3853c754940e2290fed063/ollama-0.6.1-py3-none-any.whl", hash = "sha256:fc4c984b345735c5486faeee67d8a265214a31cbb828167782dc642ce0a2bf8c", size = 14354, upload-time = "2025-11-13T23:02:16.292Z" }, +] + [[package]] name = "onnxruntime" version = "1.22.0" @@ -1571,6 +1607,23 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/c3/16/873b955beda7bada5b0d798d3a601b2ff210e44ad5169f6d405b93892103/onnxruntime-1.22.0-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:64845709f9e8a2809e8e009bc4c8f73b788cee9c6619b7d9930344eae4c9cd36", size = 16427482, upload-time = "2025-05-09T20:26:20.376Z" }, ] +[[package]] +name = "opencv-python" +version = "4.12.0.88" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "numpy" }, +] +sdist = { url = 
"https://files.pythonhosted.org/packages/ac/71/25c98e634b6bdeca4727c7f6d6927b056080668c5008ad3c8fc9e7f8f6ec/opencv-python-4.12.0.88.tar.gz", hash = "sha256:8b738389cede219405f6f3880b851efa3415ccd674752219377353f017d2994d", size = 95373294, upload-time = "2025-07-07T09:20:52.389Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/85/68/3da40142e7c21e9b1d4e7ddd6c58738feb013203e6e4b803d62cdd9eb96b/opencv_python-4.12.0.88-cp37-abi3-macosx_13_0_arm64.whl", hash = "sha256:f9a1f08883257b95a5764bf517a32d75aec325319c8ed0f89739a57fae9e92a5", size = 37877727, upload-time = "2025-07-07T09:13:31.47Z" }, + { url = "https://files.pythonhosted.org/packages/33/7c/042abe49f58d6ee7e1028eefc3334d98ca69b030e3b567fe245a2b28ea6f/opencv_python-4.12.0.88-cp37-abi3-macosx_13_0_x86_64.whl", hash = "sha256:812eb116ad2b4de43ee116fcd8991c3a687f099ada0b04e68f64899c09448e81", size = 57326471, upload-time = "2025-07-07T09:13:41.26Z" }, + { url = "https://files.pythonhosted.org/packages/62/3a/440bd64736cf8116f01f3b7f9f2e111afb2e02beb2ccc08a6458114a6b5d/opencv_python-4.12.0.88-cp37-abi3-manylinux2014_aarch64.manylinux_2_17_aarch64.whl", hash = "sha256:51fd981c7df6af3e8f70b1556696b05224c4e6b6777bdd2a46b3d4fb09de1a92", size = 45887139, upload-time = "2025-07-07T09:13:50.761Z" }, + { url = "https://files.pythonhosted.org/packages/68/1f/795e7f4aa2eacc59afa4fb61a2e35e510d06414dd5a802b51a012d691b37/opencv_python-4.12.0.88-cp37-abi3-manylinux2014_x86_64.manylinux_2_17_x86_64.whl", hash = "sha256:092c16da4c5a163a818f120c22c5e4a2f96e0db4f24e659c701f1fe629a690f9", size = 67041680, upload-time = "2025-07-07T09:14:01.995Z" }, + { url = "https://files.pythonhosted.org/packages/02/96/213fea371d3cb2f1d537612a105792aa0a6659fb2665b22cad709a75bd94/opencv_python-4.12.0.88-cp37-abi3-win32.whl", hash = "sha256:ff554d3f725b39878ac6a2e1fa232ec509c36130927afc18a1719ebf4fbf4357", size = 30284131, upload-time = "2025-07-07T09:14:08.819Z" }, + { url = 
"https://files.pythonhosted.org/packages/fa/80/eb88edc2e2b11cd2dd2e56f1c80b5784d11d6e6b7f04a1145df64df40065/opencv_python-4.12.0.88-cp37-abi3-win_amd64.whl", hash = "sha256:d98edb20aa932fd8ebd276a72627dad9dc097695b3d435a4257557bbb49a79d2", size = 39000307, upload-time = "2025-07-07T09:14:16.641Z" }, +] + [[package]] name = "opentelemetry-api" version = "1.33.1" @@ -1709,6 +1762,53 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/20/12/38679034af332785aac8774540895e234f4d07f7545804097de4b666afd8/packaging-25.0-py3-none-any.whl", hash = "sha256:29572ef2b1f17581046b3a2227d5c611fb25ec70ca1ba8554b24b0e69331a484", size = 66469, upload-time = "2025-04-19T11:48:57.875Z" }, ] +[[package]] +name = "pandas" +version = "2.3.3" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "numpy" }, + { name = "python-dateutil" }, + { name = "pytz" }, + { name = "tzdata" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/33/01/d40b85317f86cf08d853a4f495195c73815fdf205eef3993821720274518/pandas-2.3.3.tar.gz", hash = "sha256:e05e1af93b977f7eafa636d043f9f94c7ee3ac81af99c13508215942e64c993b", size = 4495223, upload-time = "2025-09-29T23:34:51.853Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/9c/fb/231d89e8637c808b997d172b18e9d4a4bc7bf31296196c260526055d1ea0/pandas-2.3.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:6d21f6d74eb1725c2efaa71a2bfc661a0689579b58e9c0ca58a739ff0b002b53", size = 11597846, upload-time = "2025-09-29T23:19:48.856Z" }, + { url = "https://files.pythonhosted.org/packages/5c/bd/bf8064d9cfa214294356c2d6702b716d3cf3bb24be59287a6a21e24cae6b/pandas-2.3.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:3fd2f887589c7aa868e02632612ba39acb0b8948faf5cc58f0850e165bd46f35", size = 10729618, upload-time = "2025-09-29T23:39:08.659Z" }, + { url = 
"https://files.pythonhosted.org/packages/57/56/cf2dbe1a3f5271370669475ead12ce77c61726ffd19a35546e31aa8edf4e/pandas-2.3.3-cp312-cp312-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:ecaf1e12bdc03c86ad4a7ea848d66c685cb6851d807a26aa245ca3d2017a1908", size = 11737212, upload-time = "2025-09-29T23:19:59.765Z" }, + { url = "https://files.pythonhosted.org/packages/e5/63/cd7d615331b328e287d8233ba9fdf191a9c2d11b6af0c7a59cfcec23de68/pandas-2.3.3-cp312-cp312-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b3d11d2fda7eb164ef27ffc14b4fcab16a80e1ce67e9f57e19ec0afaf715ba89", size = 12362693, upload-time = "2025-09-29T23:20:14.098Z" }, + { url = "https://files.pythonhosted.org/packages/a6/de/8b1895b107277d52f2b42d3a6806e69cfef0d5cf1d0ba343470b9d8e0a04/pandas-2.3.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:a68e15f780eddf2b07d242e17a04aa187a7ee12b40b930bfdd78070556550e98", size = 12771002, upload-time = "2025-09-29T23:20:26.76Z" }, + { url = "https://files.pythonhosted.org/packages/87/21/84072af3187a677c5893b170ba2c8fbe450a6ff911234916da889b698220/pandas-2.3.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:371a4ab48e950033bcf52b6527eccb564f52dc826c02afd9a1bc0ab731bba084", size = 13450971, upload-time = "2025-09-29T23:20:41.344Z" }, + { url = "https://files.pythonhosted.org/packages/86/41/585a168330ff063014880a80d744219dbf1dd7a1c706e75ab3425a987384/pandas-2.3.3-cp312-cp312-win_amd64.whl", hash = "sha256:a16dcec078a01eeef8ee61bf64074b4e524a2a3f4b3be9326420cabe59c4778b", size = 10992722, upload-time = "2025-09-29T23:20:54.139Z" }, + { url = "https://files.pythonhosted.org/packages/cd/4b/18b035ee18f97c1040d94debd8f2e737000ad70ccc8f5513f4eefad75f4b/pandas-2.3.3-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:56851a737e3470de7fa88e6131f41281ed440d29a9268dcbf0002da5ac366713", size = 11544671, upload-time = "2025-09-29T23:21:05.024Z" }, + { url = 
"https://files.pythonhosted.org/packages/31/94/72fac03573102779920099bcac1c3b05975c2cb5f01eac609faf34bed1ca/pandas-2.3.3-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:bdcd9d1167f4885211e401b3036c0c8d9e274eee67ea8d0758a256d60704cfe8", size = 10680807, upload-time = "2025-09-29T23:21:15.979Z" }, + { url = "https://files.pythonhosted.org/packages/16/87/9472cf4a487d848476865321de18cc8c920b8cab98453ab79dbbc98db63a/pandas-2.3.3-cp313-cp313-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:e32e7cc9af0f1cc15548288a51a3b681cc2a219faa838e995f7dc53dbab1062d", size = 11709872, upload-time = "2025-09-29T23:21:27.165Z" }, + { url = "https://files.pythonhosted.org/packages/15/07/284f757f63f8a8d69ed4472bfd85122bd086e637bf4ed09de572d575a693/pandas-2.3.3-cp313-cp313-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:318d77e0e42a628c04dc56bcef4b40de67918f7041c2b061af1da41dcff670ac", size = 12306371, upload-time = "2025-09-29T23:21:40.532Z" }, + { url = "https://files.pythonhosted.org/packages/33/81/a3afc88fca4aa925804a27d2676d22dcd2031c2ebe08aabd0ae55b9ff282/pandas-2.3.3-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:4e0a175408804d566144e170d0476b15d78458795bb18f1304fb94160cabf40c", size = 12765333, upload-time = "2025-09-29T23:21:55.77Z" }, + { url = "https://files.pythonhosted.org/packages/8d/0f/b4d4ae743a83742f1153464cf1a8ecfafc3ac59722a0b5c8602310cb7158/pandas-2.3.3-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:93c2d9ab0fc11822b5eece72ec9587e172f63cff87c00b062f6e37448ced4493", size = 13418120, upload-time = "2025-09-29T23:22:10.109Z" }, + { url = "https://files.pythonhosted.org/packages/4f/c7/e54682c96a895d0c808453269e0b5928a07a127a15704fedb643e9b0a4c8/pandas-2.3.3-cp313-cp313-win_amd64.whl", hash = "sha256:f8bfc0e12dc78f777f323f55c58649591b2cd0c43534e8355c51d3fede5f4dee", size = 10993991, upload-time = "2025-09-29T23:25:04.889Z" }, + { url = 
"https://files.pythonhosted.org/packages/f9/ca/3f8d4f49740799189e1395812f3bf23b5e8fc7c190827d55a610da72ce55/pandas-2.3.3-cp313-cp313t-macosx_10_13_x86_64.whl", hash = "sha256:75ea25f9529fdec2d2e93a42c523962261e567d250b0013b16210e1d40d7c2e5", size = 12048227, upload-time = "2025-09-29T23:22:24.343Z" }, + { url = "https://files.pythonhosted.org/packages/0e/5a/f43efec3e8c0cc92c4663ccad372dbdff72b60bdb56b2749f04aa1d07d7e/pandas-2.3.3-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:74ecdf1d301e812db96a465a525952f4dde225fdb6d8e5a521d47e1f42041e21", size = 11411056, upload-time = "2025-09-29T23:22:37.762Z" }, + { url = "https://files.pythonhosted.org/packages/46/b1/85331edfc591208c9d1a63a06baa67b21d332e63b7a591a5ba42a10bb507/pandas-2.3.3-cp313-cp313t-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6435cb949cb34ec11cc9860246ccb2fdc9ecd742c12d3304989017d53f039a78", size = 11645189, upload-time = "2025-09-29T23:22:51.688Z" }, + { url = "https://files.pythonhosted.org/packages/44/23/78d645adc35d94d1ac4f2a3c4112ab6f5b8999f4898b8cdf01252f8df4a9/pandas-2.3.3-cp313-cp313t-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:900f47d8f20860de523a1ac881c4c36d65efcb2eb850e6948140fa781736e110", size = 12121912, upload-time = "2025-09-29T23:23:05.042Z" }, + { url = "https://files.pythonhosted.org/packages/53/da/d10013df5e6aaef6b425aa0c32e1fc1f3e431e4bcabd420517dceadce354/pandas-2.3.3-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:a45c765238e2ed7d7c608fc5bc4a6f88b642f2f01e70c0c23d2224dd21829d86", size = 12712160, upload-time = "2025-09-29T23:23:28.57Z" }, + { url = "https://files.pythonhosted.org/packages/bd/17/e756653095a083d8a37cbd816cb87148debcfcd920129b25f99dd8d04271/pandas-2.3.3-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:c4fc4c21971a1a9f4bdb4c73978c7f7256caa3e62b323f70d6cb80db583350bc", size = 13199233, upload-time = "2025-09-29T23:24:24.876Z" }, + { url = 
"https://files.pythonhosted.org/packages/04/fd/74903979833db8390b73b3a8a7d30d146d710bd32703724dd9083950386f/pandas-2.3.3-cp314-cp314-macosx_10_13_x86_64.whl", hash = "sha256:ee15f284898e7b246df8087fc82b87b01686f98ee67d85a17b7ab44143a3a9a0", size = 11540635, upload-time = "2025-09-29T23:25:52.486Z" }, + { url = "https://files.pythonhosted.org/packages/21/00/266d6b357ad5e6d3ad55093a7e8efc7dd245f5a842b584db9f30b0f0a287/pandas-2.3.3-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:1611aedd912e1ff81ff41c745822980c49ce4a7907537be8692c8dbc31924593", size = 10759079, upload-time = "2025-09-29T23:26:33.204Z" }, + { url = "https://files.pythonhosted.org/packages/ca/05/d01ef80a7a3a12b2f8bbf16daba1e17c98a2f039cbc8e2f77a2c5a63d382/pandas-2.3.3-cp314-cp314-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:6d2cefc361461662ac48810cb14365a365ce864afe85ef1f447ff5a1e99ea81c", size = 11814049, upload-time = "2025-09-29T23:27:15.384Z" }, + { url = "https://files.pythonhosted.org/packages/15/b2/0e62f78c0c5ba7e3d2c5945a82456f4fac76c480940f805e0b97fcbc2f65/pandas-2.3.3-cp314-cp314-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ee67acbbf05014ea6c763beb097e03cd629961c8a632075eeb34247120abcb4b", size = 12332638, upload-time = "2025-09-29T23:27:51.625Z" }, + { url = "https://files.pythonhosted.org/packages/c5/33/dd70400631b62b9b29c3c93d2feee1d0964dc2bae2e5ad7a6c73a7f25325/pandas-2.3.3-cp314-cp314-musllinux_1_2_aarch64.whl", hash = "sha256:c46467899aaa4da076d5abc11084634e2d197e9460643dd455ac3db5856b24d6", size = 12886834, upload-time = "2025-09-29T23:28:21.289Z" }, + { url = "https://files.pythonhosted.org/packages/d3/18/b5d48f55821228d0d2692b34fd5034bb185e854bdb592e9c640f6290e012/pandas-2.3.3-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:6253c72c6a1d990a410bc7de641d34053364ef8bcd3126f7e7450125887dffe3", size = 13409925, upload-time = "2025-09-29T23:28:58.261Z" }, + { url = 
"https://files.pythonhosted.org/packages/a6/3d/124ac75fcd0ecc09b8fdccb0246ef65e35b012030defb0e0eba2cbbbe948/pandas-2.3.3-cp314-cp314-win_amd64.whl", hash = "sha256:1b07204a219b3b7350abaae088f451860223a52cfb8a6c53358e7948735158e5", size = 11109071, upload-time = "2025-09-29T23:32:27.484Z" }, + { url = "https://files.pythonhosted.org/packages/89/9c/0e21c895c38a157e0faa1fb64587a9226d6dd46452cac4532d80c3c4a244/pandas-2.3.3-cp314-cp314t-macosx_10_13_x86_64.whl", hash = "sha256:2462b1a365b6109d275250baaae7b760fd25c726aaca0054649286bcfbb3e8ec", size = 12048504, upload-time = "2025-09-29T23:29:31.47Z" }, + { url = "https://files.pythonhosted.org/packages/d7/82/b69a1c95df796858777b68fbe6a81d37443a33319761d7c652ce77797475/pandas-2.3.3-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:0242fe9a49aa8b4d78a4fa03acb397a58833ef6199e9aa40a95f027bb3a1b6e7", size = 11410702, upload-time = "2025-09-29T23:29:54.591Z" }, + { url = "https://files.pythonhosted.org/packages/f9/88/702bde3ba0a94b8c73a0181e05144b10f13f29ebfc2150c3a79062a8195d/pandas-2.3.3-cp314-cp314t-manylinux_2_24_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a21d830e78df0a515db2b3d2f5570610f5e6bd2e27749770e8bb7b524b89b450", size = 11634535, upload-time = "2025-09-29T23:30:21.003Z" }, + { url = "https://files.pythonhosted.org/packages/a4/1e/1bac1a839d12e6a82ec6cb40cda2edde64a2013a66963293696bbf31fbbb/pandas-2.3.3-cp314-cp314t-manylinux_2_24_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:2e3ebdb170b5ef78f19bfb71b0dc5dc58775032361fa188e814959b74d726dd5", size = 12121582, upload-time = "2025-09-29T23:30:43.391Z" }, + { url = "https://files.pythonhosted.org/packages/44/91/483de934193e12a3b1d6ae7c8645d083ff88dec75f46e827562f1e4b4da6/pandas-2.3.3-cp314-cp314t-musllinux_1_2_aarch64.whl", hash = "sha256:d051c0e065b94b7a3cea50eb1ec32e912cd96dba41647eb24104b6c6c14c5788", size = 12699963, upload-time = "2025-09-29T23:31:10.009Z" }, + { url = 
"https://files.pythonhosted.org/packages/70/44/5191d2e4026f86a2a109053e194d3ba7a31a2d10a9c2348368c63ed4e85a/pandas-2.3.3-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:3869faf4bd07b3b66a9f462417d0ca3a9df29a9f6abd5d0d0dbab15dac7abe87", size = 13202175, upload-time = "2025-09-29T23:31:59.173Z" }, +] + [[package]] name = "pandocfilters" version = "1.5.1" @@ -1732,7 +1832,7 @@ name = "pexpect" version = "4.9.0" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "ptyprocess", marker = "sys_platform != 'win32'" }, + { name = "ptyprocess" }, ] sdist = { url = "https://files.pythonhosted.org/packages/42/92/cc564bf6381ff43ce1f4d06852fc19a2f11d180f23dc32d9588bee2f149d/pexpect-4.9.0.tar.gz", hash = "sha256:ee7d41123f3c9911050ea2c2dac107568dc43b2d3b0c7557a33212c398ead30f", size = 166450, upload-time = "2023-11-25T09:07:26.339Z" } wheels = [ @@ -1873,6 +1973,35 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/8e/37/efad0257dc6e593a18957422533ff0f87ede7c9c6ea010a2177d738fb82f/pure_eval-0.2.3-py3-none-any.whl", hash = "sha256:1db8e35b67b3d218d818ae653e27f06c3aa420901fa7b081ca98cbedc874e0d0", size = 11842, upload-time = "2024-07-21T12:58:20.04Z" }, ] +[[package]] +name = "pyarrow" +version = "21.0.0" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/ef/c2/ea068b8f00905c06329a3dfcd40d0fcc2b7d0f2e355bdb25b65e0a0e4cd4/pyarrow-21.0.0.tar.gz", hash = "sha256:5051f2dccf0e283ff56335760cbc8622cf52264d67e359d5569541ac11b6d5bc", size = 1133487, upload-time = "2025-07-18T00:57:31.761Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/ca/d4/d4f817b21aacc30195cf6a46ba041dd1be827efa4a623cc8bf39a1c2a0c0/pyarrow-21.0.0-cp312-cp312-macosx_12_0_arm64.whl", hash = "sha256:3a302f0e0963db37e0a24a70c56cf91a4faa0bca51c23812279ca2e23481fccd", size = 31160305, upload-time = "2025-07-18T00:55:35.373Z" }, + { url = 
"https://files.pythonhosted.org/packages/a2/9c/dcd38ce6e4b4d9a19e1d36914cb8e2b1da4e6003dd075474c4cfcdfe0601/pyarrow-21.0.0-cp312-cp312-macosx_12_0_x86_64.whl", hash = "sha256:b6b27cf01e243871390474a211a7922bfbe3bda21e39bc9160daf0da3fe48876", size = 32684264, upload-time = "2025-07-18T00:55:39.303Z" }, + { url = "https://files.pythonhosted.org/packages/4f/74/2a2d9f8d7a59b639523454bec12dba35ae3d0a07d8ab529dc0809f74b23c/pyarrow-21.0.0-cp312-cp312-manylinux_2_28_aarch64.whl", hash = "sha256:e72a8ec6b868e258a2cd2672d91f2860ad532d590ce94cdf7d5e7ec674ccf03d", size = 41108099, upload-time = "2025-07-18T00:55:42.889Z" }, + { url = "https://files.pythonhosted.org/packages/ad/90/2660332eeb31303c13b653ea566a9918484b6e4d6b9d2d46879a33ab0622/pyarrow-21.0.0-cp312-cp312-manylinux_2_28_x86_64.whl", hash = "sha256:b7ae0bbdc8c6674259b25bef5d2a1d6af5d39d7200c819cf99e07f7dfef1c51e", size = 42829529, upload-time = "2025-07-18T00:55:47.069Z" }, + { url = "https://files.pythonhosted.org/packages/33/27/1a93a25c92717f6aa0fca06eb4700860577d016cd3ae51aad0e0488ac899/pyarrow-21.0.0-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:58c30a1729f82d201627c173d91bd431db88ea74dcaa3885855bc6203e433b82", size = 43367883, upload-time = "2025-07-18T00:55:53.069Z" }, + { url = "https://files.pythonhosted.org/packages/05/d9/4d09d919f35d599bc05c6950095e358c3e15148ead26292dfca1fb659b0c/pyarrow-21.0.0-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:072116f65604b822a7f22945a7a6e581cfa28e3454fdcc6939d4ff6090126623", size = 45133802, upload-time = "2025-07-18T00:55:57.714Z" }, + { url = "https://files.pythonhosted.org/packages/71/30/f3795b6e192c3ab881325ffe172e526499eb3780e306a15103a2764916a2/pyarrow-21.0.0-cp312-cp312-win_amd64.whl", hash = "sha256:cf56ec8b0a5c8c9d7021d6fd754e688104f9ebebf1bf4449613c9531f5346a18", size = 26203175, upload-time = "2025-07-18T00:56:01.364Z" }, + { url = 
"https://files.pythonhosted.org/packages/16/ca/c7eaa8e62db8fb37ce942b1ea0c6d7abfe3786ca193957afa25e71b81b66/pyarrow-21.0.0-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:e99310a4ebd4479bcd1964dff9e14af33746300cb014aa4a3781738ac63baf4a", size = 31154306, upload-time = "2025-07-18T00:56:04.42Z" }, + { url = "https://files.pythonhosted.org/packages/ce/e8/e87d9e3b2489302b3a1aea709aaca4b781c5252fcb812a17ab6275a9a484/pyarrow-21.0.0-cp313-cp313-macosx_12_0_x86_64.whl", hash = "sha256:d2fe8e7f3ce329a71b7ddd7498b3cfac0eeb200c2789bd840234f0dc271a8efe", size = 32680622, upload-time = "2025-07-18T00:56:07.505Z" }, + { url = "https://files.pythonhosted.org/packages/84/52/79095d73a742aa0aba370c7942b1b655f598069489ab387fe47261a849e1/pyarrow-21.0.0-cp313-cp313-manylinux_2_28_aarch64.whl", hash = "sha256:f522e5709379d72fb3da7785aa489ff0bb87448a9dc5a75f45763a795a089ebd", size = 41104094, upload-time = "2025-07-18T00:56:10.994Z" }, + { url = "https://files.pythonhosted.org/packages/89/4b/7782438b551dbb0468892a276b8c789b8bbdb25ea5c5eb27faadd753e037/pyarrow-21.0.0-cp313-cp313-manylinux_2_28_x86_64.whl", hash = "sha256:69cbbdf0631396e9925e048cfa5bce4e8c3d3b41562bbd70c685a8eb53a91e61", size = 42825576, upload-time = "2025-07-18T00:56:15.569Z" }, + { url = "https://files.pythonhosted.org/packages/b3/62/0f29de6e0a1e33518dec92c65be0351d32d7ca351e51ec5f4f837a9aab91/pyarrow-21.0.0-cp313-cp313-musllinux_1_2_aarch64.whl", hash = "sha256:731c7022587006b755d0bdb27626a1a3bb004bb56b11fb30d98b6c1b4718579d", size = 43368342, upload-time = "2025-07-18T00:56:19.531Z" }, + { url = "https://files.pythonhosted.org/packages/90/c7/0fa1f3f29cf75f339768cc698c8ad4ddd2481c1742e9741459911c9ac477/pyarrow-21.0.0-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:dc56bc708f2d8ac71bd1dcb927e458c93cec10b98eb4120206a4091db7b67b99", size = 45131218, upload-time = "2025-07-18T00:56:23.347Z" }, + { url = 
"https://files.pythonhosted.org/packages/01/63/581f2076465e67b23bc5a37d4a2abff8362d389d29d8105832e82c9c811c/pyarrow-21.0.0-cp313-cp313-win_amd64.whl", hash = "sha256:186aa00bca62139f75b7de8420f745f2af12941595bbbfa7ed3870ff63e25636", size = 26087551, upload-time = "2025-07-18T00:56:26.758Z" }, + { url = "https://files.pythonhosted.org/packages/c9/ab/357d0d9648bb8241ee7348e564f2479d206ebe6e1c47ac5027c2e31ecd39/pyarrow-21.0.0-cp313-cp313t-macosx_12_0_arm64.whl", hash = "sha256:a7a102574faa3f421141a64c10216e078df467ab9576684d5cd696952546e2da", size = 31290064, upload-time = "2025-07-18T00:56:30.214Z" }, + { url = "https://files.pythonhosted.org/packages/3f/8a/5685d62a990e4cac2043fc76b4661bf38d06efed55cf45a334b455bd2759/pyarrow-21.0.0-cp313-cp313t-macosx_12_0_x86_64.whl", hash = "sha256:1e005378c4a2c6db3ada3ad4c217b381f6c886f0a80d6a316fe586b90f77efd7", size = 32727837, upload-time = "2025-07-18T00:56:33.935Z" }, + { url = "https://files.pythonhosted.org/packages/fc/de/c0828ee09525c2bafefd3e736a248ebe764d07d0fd762d4f0929dbc516c9/pyarrow-21.0.0-cp313-cp313t-manylinux_2_28_aarch64.whl", hash = "sha256:65f8e85f79031449ec8706b74504a316805217b35b6099155dd7e227eef0d4b6", size = 41014158, upload-time = "2025-07-18T00:56:37.528Z" }, + { url = "https://files.pythonhosted.org/packages/6e/26/a2865c420c50b7a3748320b614f3484bfcde8347b2639b2b903b21ce6a72/pyarrow-21.0.0-cp313-cp313t-manylinux_2_28_x86_64.whl", hash = "sha256:3a81486adc665c7eb1a2bde0224cfca6ceaba344a82a971ef059678417880eb8", size = 42667885, upload-time = "2025-07-18T00:56:41.483Z" }, + { url = "https://files.pythonhosted.org/packages/0a/f9/4ee798dc902533159250fb4321267730bc0a107d8c6889e07c3add4fe3a5/pyarrow-21.0.0-cp313-cp313t-musllinux_1_2_aarch64.whl", hash = "sha256:fc0d2f88b81dcf3ccf9a6ae17f89183762c8a94a5bdcfa09e05cfe413acf0503", size = 43276625, upload-time = "2025-07-18T00:56:48.002Z" }, + { url = 
"https://files.pythonhosted.org/packages/5a/da/e02544d6997037a4b0d22d8e5f66bc9315c3671371a8b18c79ade1cefe14/pyarrow-21.0.0-cp313-cp313t-musllinux_1_2_x86_64.whl", hash = "sha256:6299449adf89df38537837487a4f8d3bd91ec94354fdd2a7d30bc11c48ef6e79", size = 44951890, upload-time = "2025-07-18T00:56:52.568Z" }, + { url = "https://files.pythonhosted.org/packages/e5/4e/519c1bc1876625fe6b71e9a28287c43ec2f20f73c658b9ae1d485c0c206e/pyarrow-21.0.0-cp313-cp313t-win_amd64.whl", hash = "sha256:222c39e2c70113543982c6b34f3077962b44fca38c0bd9e68bb6781534425c10", size = 26371006, upload-time = "2025-07-18T00:56:56.379Z" }, +] + [[package]] name = "pyasn1" version = "0.6.1" @@ -2019,6 +2148,19 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/6f/9a/e73262f6c6656262b5fdd723ad90f518f579b7bc8622e43a942eec53c938/pydantic_core-2.33.2-cp313-cp313t-win_amd64.whl", hash = "sha256:c2fc0a768ef76c15ab9238afa6da7f69895bb5d1ee83aeea2e3509af4472d0b9", size = 1935777, upload-time = "2025-04-23T18:32:25.088Z" }, ] +[[package]] +name = "pydeck" +version = "0.9.1" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "jinja2" }, + { name = "numpy" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/a1/ca/40e14e196864a0f61a92abb14d09b3d3da98f94ccb03b49cf51688140dab/pydeck-0.9.1.tar.gz", hash = "sha256:f74475ae637951d63f2ee58326757f8d4f9cd9f2a457cf42950715003e2cb605", size = 3832240, upload-time = "2024-05-10T15:36:21.153Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/ab/4c/b888e6cf58bd9db9c93f40d1c6be8283ff49d88919231afe93a6bcf61626/pydeck-0.9.1-py2.py3-none-any.whl", hash = "sha256:b3f75ba0d273fc917094fa61224f3f6076ca8752b93d46faf3bcfd9f9d59b038", size = 6900403, upload-time = "2024-05-10T15:36:17.36Z" }, +] + [[package]] name = "pygments" version = "2.19.1" @@ -2083,19 +2225,12 @@ wheels = [ ] [[package]] -name = "pytorch-triton-xpu" -version = "3.3.0" -source = { registry = "https://download.pytorch.org/whl/xpu" } -dependencies = [ 
- { name = "setuptools", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, -] +name = "pytz" +version = "2025.2" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/f8/bf/abbd3cdfb8fbc7fb3d4d38d320f2441b1e7cbe29be4f23797b4a2b5d8aac/pytz-2025.2.tar.gz", hash = "sha256:360b9e3dbb49a209c21ad61809c7fb453643e048b38924c765813546746e81c3", size = 320884, upload-time = "2025-03-25T02:25:00.538Z" } wheels = [ - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:40f6fb65b345dc9a61813abe7ac9a585f2c9808f414d140cc2a5f11f53ee063c" }, - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp312-cp312-win_amd64.whl", hash = "sha256:0dd07e6d5b872e42e48f5ee140e609d4554ca3cc509d5bf509ac232267cf358e" }, - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b22b4c02ec71b4bfc862ae3cdfd2871dc0b05d2b1802f5db2196e0f897d581e9" }, - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp313-cp313-win_amd64.whl", hash = "sha256:a936a18182d8e065a9933afc9a3ebbffadd38604969f87c493831214539fc027" }, - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:9821fe059de58e827ffc6aa10d69369b16c2f8c2a988b86bef9c2c6e396ab3aa" }, - { url = "https://download.pytorch.org/whl/pytorch_triton_xpu-3.3.0-cp313-cp313t-win_amd64.whl", hash = "sha256:07c18df9202c4dd30096ba22e36335cd5db827e83f110091b763fbd066498f3e" }, + { url = "https://files.pythonhosted.org/packages/81/c4/34e93fe5f5429d7570ec1fa436f1986fb1f00c3e0f43a589fe2bbcd22c3f/pytz-2025.2-py2.py3-none-any.whl", hash = "sha256:5ddf76296dd8c44c26eb8f4b6f35488f3ccbf6fbbd7adee0b7262d43f0ec2f00", size = 509225, upload-time = "2025-03-25T02:24:58.468Z" }, ] [[package]] @@ -2189,26 +2324,6 @@ 
wheels = [ { url = "https://files.pythonhosted.org/packages/05/4c/bf3cad0d64c3214ac881299c4562b815f05d503bccc513e3fd4fdc6f67e4/pyzmq-26.4.0-cp313-cp313t-musllinux_1_1_x86_64.whl", hash = "sha256:26a2a7451606b87f67cdeca2c2789d86f605da08b4bd616b1a9981605ca3a364", size = 1395540, upload-time = "2025-04-04T12:04:30.562Z" }, ] -[[package]] -name = "qwen-vl-utils" -version = "0.0.11" -source = { registry = "https://pypi.org/simple" } -dependencies = [ - { name = "av" }, - { name = "packaging" }, - { name = "pillow" }, - { name = "requests" }, -] -sdist = { url = "https://files.pythonhosted.org/packages/42/9f/1229a40ebd49f689a0252144126f3865f31bb4151e942cf781a2936f0c4d/qwen_vl_utils-0.0.11.tar.gz", hash = "sha256:083ba1e5cfa5002165b1e3bddd4d6d26d1d6d34473884033ef12ae3fe8496cd5", size = 7924, upload-time = "2025-04-21T10:38:47.461Z" } -wheels = [ - { url = "https://files.pythonhosted.org/packages/0a/c2/ad7f93e1eea4ea0aefd1cc6fbe7a7095fd2f03a4d8fe2c3707e612b0866e/qwen_vl_utils-0.0.11-py3-none-any.whl", hash = "sha256:7fd5287ac04d6c1f01b93bf053b0be236a35149e414c9e864e3cc5bf2fe8cb7b", size = 7584, upload-time = "2025-04-21T10:38:45.595Z" }, -] - -[package.optional-dependencies] -decord = [ - { name = "decord" }, -] - [[package]] name = "referencing" version = "0.36.2" @@ -2490,8 +2605,7 @@ dependencies = [ { name = "pillow" }, { name = "scikit-learn" }, { name = "scipy" }, - { name = "torch", version = "2.7.0", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "torch", version = "2.7.0+xpu", source = { registry = "https://download.pytorch.org/whl/xpu" }, marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "torch" }, { name = "tqdm" }, { name = "transformers" }, { name = "typing-extensions" }, @@ -2528,6 +2642,15 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/b7/ce/149a00dd41f10bc29e5921b496af8b574d8413afcd5e30dfa0ed46c2cc5e/six-1.17.0-py2.py3-none-any.whl", 
hash = "sha256:4721f391ed90541fddacab5acf947aa0d3dc7d27b2e1e8eda2be8970586c3274", size = 11050, upload-time = "2024-12-04T17:35:26.475Z" }, ] +[[package]] +name = "smmap" +version = "5.0.2" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/44/cd/a040c4b3119bbe532e5b0732286f805445375489fceaec1f48306068ee3b/smmap-5.0.2.tar.gz", hash = "sha256:26ea65a03958fa0c8a1c7e8c7a58fdc77221b8910f6be2131affade476898ad5", size = 22329, upload-time = "2025-01-02T07:14:40.909Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/04/be/d09147ad1ec7934636ad912901c5fd7667e1c858e19d355237db0d0cd5e4/smmap-5.0.2-py3-none-any.whl", hash = "sha256:b30115f0def7d7531d22a0fb6502488d879e75b260a9db4d0819cfb25403af5e", size = 24303, upload-time = "2025-01-02T07:14:38.724Z" }, +] + [[package]] name = "sniffio" version = "1.3.1" @@ -2561,24 +2684,44 @@ wheels = [ ] [[package]] -name = "sympy" -version = "1.14.0" +name = "streamlit" +version = "1.51.0" source = { registry = "https://pypi.org/simple" } dependencies = [ - { name = "mpmath" }, + { name = "altair" }, + { name = "blinker" }, + { name = "cachetools" }, + { name = "click" }, + { name = "gitpython" }, + { name = "numpy" }, + { name = "packaging" }, + { name = "pandas" }, + { name = "pillow" }, + { name = "protobuf" }, + { name = "pyarrow" }, + { name = "pydeck" }, + { name = "requests" }, + { name = "tenacity" }, + { name = "toml" }, + { name = "tornado" }, + { name = "typing-extensions" }, + { name = "watchdog", marker = "sys_platform != 'darwin'" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/83/d3/803453b36afefb7c2bb238361cd4ae6125a569b4db67cd9e79846ba2d68c/sympy-1.14.0.tar.gz", hash = "sha256:d3d3fe8df1e5a0b42f0e7bdf50541697dbe7d23746e894990c030e2b05e72517", size = 7793921, upload-time = "2025-04-27T18:05:01.611Z" } +sdist = { url = 
"https://files.pythonhosted.org/packages/59/6d/327ddd5fc35fcf2aeecb4040668337f5565a1c6c95b1e892b8bfd4bb9031/streamlit-1.51.0.tar.gz", hash = "sha256:1e742a9c0b698f466c6f5bf58d333beda5a1fbe8de660743976791b5c1446ef6", size = 9742904, upload-time = "2025-10-29T17:07:39.082Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/a2/09/77d55d46fd61b4a135c444fc97158ef34a095e5681d0a6c10b75bf356191/sympy-1.14.0-py3-none-any.whl", hash = "sha256:e091cc3e99d2141a0ba2847328f5479b05d94a6635cb96148ccb3f34671bd8f5", size = 6299353, upload-time = "2025-04-27T18:04:59.103Z" }, + { url = "https://files.pythonhosted.org/packages/39/60/868371b6482ccd9ef423c6f62650066cf8271fdb2ee84f192695ad6b7a96/streamlit-1.51.0-py3-none-any.whl", hash = "sha256:4008b029f71401ce54946bb09a6a3e36f4f7652cbb48db701224557738cfda38", size = 10171702, upload-time = "2025-10-29T17:07:35.97Z" }, ] [[package]] -name = "tcmlib" -version = "1.2.0" +name = "sympy" +version = "1.14.0" source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "mpmath" }, +] +sdist = { url = "https://files.pythonhosted.org/packages/83/d3/803453b36afefb7c2bb238361cd4ae6125a569b4db67cd9e79846ba2d68c/sympy-1.14.0.tar.gz", hash = "sha256:d3d3fe8df1e5a0b42f0e7bdf50541697dbe7d23746e894990c030e2b05e72517", size = 7793921, upload-time = "2025-04-27T18:05:01.611Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/4d/6e/e9544e6ddb3640e92d9937689e9e33018503ddbc069eeb2e6a7581870591/tcmlib-1.2.0-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:dee9a0665ffa0a74f0ec72844ef7d82e9178ebf6980a76ac65906303d5ed4d03", size = 4160997, upload-time = "2024-10-25T10:59:37.067Z" }, - { url = "https://files.pythonhosted.org/packages/5b/c8/c2a7bb169e21521a5bc82d955b30a064e266ab72485ac2dc33cd6ad153ea/tcmlib-1.2.0-py2.py3-none-win_amd64.whl", hash = "sha256:f751e005fd815ed0efeb87d4523f6a0938c5671e59ac935614f42d8ebb6489c9", size = 338379, upload-time = "2024-10-25T10:59:32.959Z" }, + { url = 
"https://files.pythonhosted.org/packages/a2/09/77d55d46fd61b4a135c444fc97158ef34a095e5681d0a6c10b75bf356191/sympy-1.14.0-py3-none-any.whl", hash = "sha256:e091cc3e99d2141a0ba2847328f5479b05d94a6635cb96148ccb3f34671bd8f5", size = 6299353, upload-time = "2025-04-27T18:04:59.103Z" }, ] [[package]] @@ -2596,7 +2739,7 @@ version = "0.18.1" source = { registry = "https://pypi.org/simple" } dependencies = [ { name = "ptyprocess", marker = "os_name != 'nt'" }, - { name = "pywinpty", marker = "os_name == 'nt' and sys_platform != 'linux'" }, + { name = "pywinpty", marker = "os_name == 'nt'" }, { name = "tornado" }, ] sdist = { url = "https://files.pythonhosted.org/packages/8a/11/965c6fd8e5cc254f1fe142d547387da17a8ebfd75a3455f637c663fb38a0/terminado-0.18.1.tar.gz", hash = "sha256:de09f2c4b85de4765f7714688fff57d3e75bad1f909b589fde880460c753fd2e", size = 32701, upload-time = "2024-03-12T14:34:39.026Z" } @@ -2651,112 +2794,55 @@ wheels = [ ] [[package]] -name = "torch" -version = "2.7.0" +name = "toml" +version = "0.10.2" source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", - "python_full_version < '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", -] -dependencies = [ - { name = "filelock", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "fsspec", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "jinja2", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "networkx", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "setuptools", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "sympy", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "typing-extensions", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, -] +sdist = { url = 
"https://files.pythonhosted.org/packages/be/ba/1f744cdc819428fc6b5084ec34d9b30660f6f9daaf70eead706e3203ec3c/toml-0.10.2.tar.gz", hash = "sha256:b3bda1d108d5dd99f4a20d24d9c348e91c4db7ab1b749200bded2f839ccbe68f", size = 22253, upload-time = "2020-11-01T01:40:22.204Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/ee/8d/b2939e5254be932db1a34b2bd099070c509e8887e0c5a90c498a917e4032/torch-2.7.0-cp312-none-macosx_11_0_arm64.whl", hash = "sha256:30b7688a87239a7de83f269333651d8e582afffce6f591fff08c046f7787296e", size = 68574294, upload-time = "2025-04-23T14:34:47.098Z" }, - { url = "https://files.pythonhosted.org/packages/28/fd/74ba6fde80e2b9eef4237fe668ffae302c76f0e4221759949a632ca13afa/torch-2.7.0-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:edad98dddd82220465b106506bb91ee5ce32bd075cddbcf2b443dfaa2cbd83bf", size = 68856166, upload-time = "2025-04-23T14:34:04.012Z" }, - { url = "https://files.pythonhosted.org/packages/90/48/7e6477cf40d48cc0a61fa0d41ee9582b9a316b12772fcac17bc1a40178e7/torch-2.7.0-cp313-none-macosx_11_0_arm64.whl", hash = "sha256:27f5007bdf45f7bb7af7f11d1828d5c2487e030690afb3d89a651fd7036a390e", size = 68575074, upload-time = "2025-04-23T14:32:38.136Z" }, + { url = "https://files.pythonhosted.org/packages/44/6f/7120676b6d73228c96e17f1f794d8ab046fc910d781c8d151120c3f1569e/toml-0.10.2-py2.py3-none-any.whl", hash = "sha256:806143ae5bfb6a3c6e736a764057db0e6a0e05e338b5630894a5f779cabb4f9b", size = 16588, upload-time = "2020-11-01T01:40:20.672Z" }, ] [[package]] name = "torch" -version = "2.7.0+xpu" -source = { registry = "https://download.pytorch.org/whl/xpu" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] -dependencies = [ - { name = "filelock", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - 
{ name = "fsspec", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "intel-cmplr-lib-rt", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-cmplr-lib-rt", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "intel-cmplr-lib-ur", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-cmplr-lib-ur", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "intel-cmplr-lic-rt", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-cmplr-lic-rt", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "intel-pti", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "intel-sycl-rt", version = "2025.0.4", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'linux'" }, - { name = "intel-sycl-rt", version = "2025.0.5", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform == 'win32'" }, - { name = "jinja2", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "networkx", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "pytorch-triton-xpu", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "setuptools", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "sympy", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "tcmlib", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "typing-extensions", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "umf", marker = "sys_platform == 'linux' or 
sys_platform == 'win32'" }, -] -wheels = [ - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp312-cp312-linux_x86_64.whl", hash = "sha256:c806d44aa2ca5d225629f6fbc6c994d5deaac2d2cde449195bc8e3522ddd219a" }, - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp312-cp312-win_amd64.whl", hash = "sha256:94739e665d9b4d5cd7af5f517cb6103f6f9fb421c095184609653a24524040f5" }, - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp313-cp313-linux_x86_64.whl", hash = "sha256:25d8277b7f01d42e2e014ccbab57a2692b6ec4eff8dcf894eda1b297407cf97a" }, - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp313-cp313-win_amd64.whl", hash = "sha256:31df3cb674918e89bc8c532baa331dc84f4430e1f9c0ec379232db44cba78355" }, - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp313-cp313t-linux_x86_64.whl", hash = "sha256:f853aa4e926102a11a8522f415e53da39b7e431b7922835f62e8a71e33f7e7dd" }, - { url = "https://download.pytorch.org/whl/xpu/torch-2.7.0%2Bxpu-cp313-cp313t-win_amd64.whl", hash = "sha256:cc286e5042fb0f628b2fdf79f570861e9340e6cc19f3e6a2ca27ce44e6fffbaf" }, -] - -[[package]] -name = "torchvision" -version = "0.22.0" +version = "2.7.0" source = { registry = "https://pypi.org/simple" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", - "python_full_version < '3.13' and sys_platform != 'linux' and sys_platform != 'win32'", -] -dependencies = [ - { name = "numpy", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "pillow", marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "torch", version = "2.7.0", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, -] -wheels = [ - { url = "https://files.pythonhosted.org/packages/cb/ea/887d1d61cf4431a46280972de665f350af1898ce5006cd046326e5d0a2f2/torchvision-0.22.0-cp312-cp312-macosx_11_0_arm64.whl", hash 
= "sha256:31c3165418fe21c3d81fe3459e51077c2f948801b8933ed18169f54652796a0f", size = 1947826, upload-time = "2025-04-23T14:41:59.188Z" }, - { url = "https://files.pythonhosted.org/packages/e1/2a/9b34685599dcb341d12fc2730055155623db7a619d2415a8d31f17050952/torchvision-0.22.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:ece17995857dd328485c9c027c0b20ffc52db232e30c84ff6c95ab77201112c5", size = 1947823, upload-time = "2025-04-23T14:41:39.956Z" }, - { url = "https://files.pythonhosted.org/packages/6f/a7/f43e9c8d13118b4ffbaebea664c9338ab20fa115a908125afd2238ff16e7/torchvision-0.22.0-cp313-cp313t-macosx_11_0_arm64.whl", hash = "sha256:cdc96daa4658b47ce9384154c86ed1e70cba9d972a19f5de6e33f8f94a626790", size = 2137621, upload-time = "2025-04-23T14:41:51.427Z" }, -] - -[[package]] -name = "torchvision" -version = "0.22.0+xpu" -source = { registry = "https://download.pytorch.org/whl/xpu" } -resolution-markers = [ - "python_full_version >= '3.13' and sys_platform == 'linux'", - "python_full_version < '3.13' and sys_platform == 'linux'", - "python_full_version >= '3.13' and sys_platform == 'win32'", - "python_full_version < '3.13' and sys_platform == 'win32'", -] dependencies = [ - { name = "numpy", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "pillow", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "torch", version = "2.7.0+xpu", source = { registry = "https://download.pytorch.org/whl/xpu" }, marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, + { name = "filelock" }, + { name = "fsspec" }, + { name = "jinja2" }, + { name = "networkx" }, + { name = "nvidia-cublas-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cuda-cupti-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cuda-nvrtc-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cuda-runtime-cu12", marker = 
"platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cudnn-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cufft-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cufile-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-curand-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cusolver-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cusparse-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-cusparselt-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-nccl-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-nvjitlink-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "nvidia-nvtx-cu12", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "setuptools" }, + { name = "sympy" }, + { name = "triton", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" }, + { name = "typing-extensions" }, ] wheels = [ - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp312-cp312-linux_x86_64.whl", hash = "sha256:b7686d566dd17f5304f52e4a8371c2d8cb7b80edc75e64ea55da82eb33cdef26" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp312-cp312-manylinux_2_28_x86_64.whl", hash = "sha256:c070dc5f1bb664c2d4a25175d21968ad01cabed26d82d1880a4642795ee958f0" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp312-cp312-win_amd64.whl", hash = "sha256:544264f62530b8d7564399ec2b72841045bfd872638646e764303b4e62a93516" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313-linux_x86_64.whl", hash = 
"sha256:2b14385884e80c9d92bcdb3d91429157044548b38f1b4784f60065c3d93d0582" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313-manylinux_2_28_x86_64.whl", hash = "sha256:73121c18fbd45a1dee9e05a2cec98c067602862433846472ff69b379bccd0ed5" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313-win_amd64.whl", hash = "sha256:ea3a5854452ab41961cf2e223ccc955b8f7018b6e92ef85ced9f923963c315b8" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313t-linux_x86_64.whl", hash = "sha256:5df2f7bfc497cc0138e8b6996bff99e8fcd60f9571e7022be30f16ca54bae33b" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313t-manylinux_2_28_x86_64.whl", hash = "sha256:6d5aa0a6d19a860ab31d72874640ab5696d4792e82aa60b0bb19a43addf4fcdc" }, - { url = "https://download.pytorch.org/whl/xpu/torchvision-0.22.0%2Bxpu-cp313-cp313t-win_amd64.whl", hash = "sha256:31c075b44af2a1cb100b09c683a82521d9a057dc8874023800d8fcedc603dee1" }, + { url = "https://files.pythonhosted.org/packages/aa/5e/ac759f4c0ab7c01feffa777bd68b43d2ac61560a9770eeac074b450f81d4/torch-2.7.0-cp312-cp312-manylinux_2_28_aarch64.whl", hash = "sha256:36a6368c7ace41ad1c0f69f18056020b6a5ca47bedaca9a2f3b578f5a104c26c", size = 99013250, upload-time = "2025-04-23T14:35:15.589Z" }, + { url = "https://files.pythonhosted.org/packages/9c/58/2d245b6f1ef61cf11dfc4aceeaacbb40fea706ccebac3f863890c720ab73/torch-2.7.0-cp312-cp312-manylinux_2_28_x86_64.whl", hash = "sha256:15aab3e31c16feb12ae0a88dba3434a458874636f360c567caa6a91f6bfba481", size = 865042157, upload-time = "2025-04-23T14:32:56.011Z" }, + { url = "https://files.pythonhosted.org/packages/44/80/b353c024e6b624cd9ce1d66dcb9d24e0294680f95b369f19280e241a0159/torch-2.7.0-cp312-cp312-win_amd64.whl", hash = "sha256:f56d4b2510934e072bab3ab8987e00e60e1262fb238176168f5e0c43a1320c6d", size = 212482262, upload-time = "2025-04-23T14:35:03.527Z" }, + { url = 
"https://files.pythonhosted.org/packages/ee/8d/b2939e5254be932db1a34b2bd099070c509e8887e0c5a90c498a917e4032/torch-2.7.0-cp312-none-macosx_11_0_arm64.whl", hash = "sha256:30b7688a87239a7de83f269333651d8e582afffce6f591fff08c046f7787296e", size = 68574294, upload-time = "2025-04-23T14:34:47.098Z" }, + { url = "https://files.pythonhosted.org/packages/14/24/720ea9a66c29151b315ea6ba6f404650834af57a26b2a04af23ec246b2d5/torch-2.7.0-cp313-cp313-manylinux_2_28_aarch64.whl", hash = "sha256:868ccdc11798535b5727509480cd1d86d74220cfdc42842c4617338c1109a205", size = 99015553, upload-time = "2025-04-23T14:34:41.075Z" }, + { url = "https://files.pythonhosted.org/packages/4b/27/285a8cf12bd7cd71f9f211a968516b07dcffed3ef0be585c6e823675ab91/torch-2.7.0-cp313-cp313-manylinux_2_28_x86_64.whl", hash = "sha256:9b52347118116cf3dff2ab5a3c3dd97c719eb924ac658ca2a7335652076df708", size = 865046389, upload-time = "2025-04-23T14:32:01.16Z" }, + { url = "https://files.pythonhosted.org/packages/74/c8/2ab2b6eadc45554af8768ae99668c5a8a8552e2012c7238ded7e9e4395e1/torch-2.7.0-cp313-cp313-win_amd64.whl", hash = "sha256:434cf3b378340efc87c758f250e884f34460624c0523fe5c9b518d205c91dd1b", size = 212490304, upload-time = "2025-04-23T14:33:57.108Z" }, + { url = "https://files.pythonhosted.org/packages/28/fd/74ba6fde80e2b9eef4237fe668ffae302c76f0e4221759949a632ca13afa/torch-2.7.0-cp313-cp313t-macosx_14_0_arm64.whl", hash = "sha256:edad98dddd82220465b106506bb91ee5ce32bd075cddbcf2b443dfaa2cbd83bf", size = 68856166, upload-time = "2025-04-23T14:34:04.012Z" }, + { url = "https://files.pythonhosted.org/packages/cb/b4/8df3f9fe6bdf59e56a0e538592c308d18638eb5f5dc4b08d02abb173c9f0/torch-2.7.0-cp313-cp313t-manylinux_2_28_aarch64.whl", hash = "sha256:2a885fc25afefb6e6eb18a7d1e8bfa01cc153e92271d980a49243b250d5ab6d9", size = 99091348, upload-time = "2025-04-23T14:33:48.975Z" }, + { url = 
"https://files.pythonhosted.org/packages/9d/f5/0bd30e9da04c3036614aa1b935a9f7e505a9e4f1f731b15e165faf8a4c74/torch-2.7.0-cp313-cp313t-manylinux_2_28_x86_64.whl", hash = "sha256:176300ff5bc11a5f5b0784e40bde9e10a35c4ae9609beed96b4aeb46a27f5fae", size = 865104023, upload-time = "2025-04-23T14:30:40.537Z" }, + { url = "https://files.pythonhosted.org/packages/d1/b7/2235d0c3012c596df1c8d39a3f4afc1ee1b6e318d469eda4c8bb68566448/torch-2.7.0-cp313-cp313t-win_amd64.whl", hash = "sha256:d0ca446a93f474985d81dc866fcc8dccefb9460a29a456f79d99c29a78a66993", size = 212750916, upload-time = "2025-04-23T14:32:22.91Z" }, + { url = "https://files.pythonhosted.org/packages/90/48/7e6477cf40d48cc0a61fa0d41ee9582b9a316b12772fcac17bc1a40178e7/torch-2.7.0-cp313-none-macosx_11_0_arm64.whl", hash = "sha256:27f5007bdf45f7bb7af7f11d1828d5c2487e030690afb3d89a651fd7036a390e", size = 68575074, upload-time = "2025-04-23T14:32:38.136Z" }, ] [[package]] @@ -2820,6 +2906,19 @@ wheels = [ { url = "https://files.pythonhosted.org/packages/5e/0c/68d03a38f6ab2ba2b2829eb11b334610dd236e7926787f7656001b68e1f2/transformers-4.53.0-py3-none-any.whl", hash = "sha256:7d8039ff032c01a2d7f8a8fe0066620367003275f023815a966e62203f9f5dd7", size = 10821970, upload-time = "2025-06-26T16:10:51.505Z" }, ] +[[package]] +name = "triton" +version = "3.3.0" +source = { registry = "https://pypi.org/simple" } +dependencies = [ + { name = "setuptools" }, +] +wheels = [ + { url = "https://files.pythonhosted.org/packages/11/53/ce18470914ab6cfbec9384ee565d23c4d1c55f0548160b1c7b33000b11fd/triton-3.3.0-cp312-cp312-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b68c778f6c4218403a6bd01be7484f6dc9e20fe2083d22dd8aef33e3b87a10a3", size = 156504509, upload-time = "2025-04-09T20:27:40.413Z" }, + { url = "https://files.pythonhosted.org/packages/7d/74/4bf2702b65e93accaa20397b74da46fb7a0356452c1bb94dbabaf0582930/triton-3.3.0-cp313-cp313-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = 
"sha256:47bc87ad66fa4ef17968299acacecaab71ce40a238890acc6ad197c3abe2b8f1", size = 156516468, upload-time = "2025-04-09T20:27:48.196Z" }, + { url = "https://files.pythonhosted.org/packages/0a/93/f28a696fa750b9b608baa236f8225dd3290e5aff27433b06143adc025961/triton-3.3.0-cp313-cp313t-manylinux_2_27_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:ce4700fc14032af1e049005ae94ba908e71cd6c2df682239aed08e49bc71b742", size = 156580729, upload-time = "2025-04-09T20:27:55.424Z" }, +] + [[package]] name = "typer" version = "0.16.0" @@ -2866,15 +2965,12 @@ wheels = [ ] [[package]] -name = "umf" -version = "0.9.1" +name = "tzdata" +version = "2025.2" source = { registry = "https://pypi.org/simple" } -dependencies = [ - { name = "tcmlib", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, -] +sdist = { url = "https://files.pythonhosted.org/packages/95/32/1a225d6164441be760d75c2c42e2780dc0873fe382da3e98a2e1e48361e5/tzdata-2025.2.tar.gz", hash = "sha256:b60a638fcc0daffadf82fe0f57e53d06bdec2f36c4df66280ae79bce6bd6f2b9", size = 196380, upload-time = "2025-03-23T13:54:43.652Z" } wheels = [ - { url = "https://files.pythonhosted.org/packages/4e/19/cef361ce4c5c1079f90d35ed853996f94cef5e68bc29b8e7d11a28b0c53b/umf-0.9.1-py2.py3-none-manylinux_2_28_x86_64.whl", hash = "sha256:2f7b8eb45e182b24823be420063799ea89b4f1cad6b9510b1fc6e04b809c7ec2", size = 161551, upload-time = "2024-11-19T15:35:00.583Z" }, - { url = "https://files.pythonhosted.org/packages/56/2a/3ccea66d7390f3b6407b396ec289d5acad7f8f92a1bd8b66b58d376fc019/umf-0.9.1-py2.py3-none-win_amd64.whl", hash = "sha256:9d1336d63c7a6b36af1f76dab942a760168da519a1bfe6941fc6418198b10820", size = 72212, upload-time = "2024-11-19T15:36:28.366Z" }, + { url = "https://files.pythonhosted.org/packages/5c/23/c7abc0ca0a1526a0774eca151daeb8de62ec457e77262b66b359c3c7679e/tzdata-2025.2-py2.py3-none-any.whl", hash = "sha256:1a403fada01ff9221ca8044d701868fa132215d84beb92242d9acd2147f667a8", size = 347839, upload-time = 
"2025-03-23T13:54:41.845Z" }, ] [[package]] @@ -2940,36 +3036,52 @@ wheels = [ ] [[package]] -name = "video-description-generation-query-retrieval" +name = "video-rag-ollama" version = "0.1.0" source = { virtual = "." } dependencies = [ { name = "chromadb" }, - { name = "huggingface-hub", extra = ["hf-xet"] }, + { name = "ipykernel" }, + { name = "ipywidgets" }, { name = "jupyter" }, - { name = "pytorch-triton-xpu", marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "qwen-vl-utils", extra = ["decord"] }, + { name = "numpy" }, + { name = "ollama" }, + { name = "opencv-python" }, { name = "sentence-transformers" }, - { name = "torch", version = "2.7.0", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "torch", version = "2.7.0+xpu", source = { registry = "https://download.pytorch.org/whl/xpu" }, marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "torchvision", version = "0.22.0", source = { registry = "https://pypi.org/simple" }, marker = "sys_platform != 'linux' and sys_platform != 'win32'" }, - { name = "torchvision", version = "0.22.0+xpu", source = { registry = "https://download.pytorch.org/whl/xpu" }, marker = "sys_platform == 'linux' or sys_platform == 'win32'" }, - { name = "transformers" }, + { name = "streamlit" }, + { name = "tqdm" }, ] [package.metadata] requires-dist = [ { name = "chromadb", specifier = ">=1.0.12" }, - { name = "huggingface-hub", extras = ["hf-xet"], specifier = ">=0.32.3" }, + { name = "ipykernel", specifier = ">=6.25.0" }, + { name = "ipywidgets", specifier = ">=8.1.0" }, { name = "jupyter", specifier = ">=1.1.1" }, - { name = "pytorch-triton-xpu", marker = "sys_platform == 'linux' or sys_platform == 'win32'", specifier = ">=3.3.0", index = "https://download.pytorch.org/whl/xpu" }, - { name = "qwen-vl-utils", extras = ["decord"], specifier = ">=0.0.11" }, + { name = "numpy", specifier = ">=1.24.0" }, + { name 
= "ollama", specifier = ">=0.4.0" }, + { name = "opencv-python", specifier = ">=4.8.0" }, { name = "sentence-transformers", specifier = ">=4.1.0" }, - { name = "torch", marker = "sys_platform != 'linux' and sys_platform != 'win32'", specifier = ">=2.7.0" }, - { name = "torch", marker = "sys_platform == 'linux' or sys_platform == 'win32'", specifier = ">=2.7.0", index = "https://download.pytorch.org/whl/xpu" }, - { name = "torchvision", marker = "sys_platform != 'linux' and sys_platform != 'win32'", specifier = ">=0.22.0" }, - { name = "torchvision", marker = "sys_platform == 'linux' or sys_platform == 'win32'", specifier = ">=0.22.0", index = "https://download.pytorch.org/whl/xpu" }, - { name = "transformers", specifier = ">=4.52.4" }, + { name = "streamlit", specifier = ">=1.30.0" }, + { name = "tqdm", specifier = ">=4.65.0" }, +] + +[[package]] +name = "watchdog" +version = "6.0.0" +source = { registry = "https://pypi.org/simple" } +sdist = { url = "https://files.pythonhosted.org/packages/db/7d/7f3d619e951c88ed75c6037b246ddcf2d322812ee8ea189be89511721d54/watchdog-6.0.0.tar.gz", hash = "sha256:9ddf7c82fda3ae8e24decda1338ede66e1c99883db93711d8fb941eaa2d8c282", size = 131220, upload-time = "2024-11-01T14:07:13.037Z" } +wheels = [ + { url = "https://files.pythonhosted.org/packages/a9/c7/ca4bf3e518cb57a686b2feb4f55a1892fd9a3dd13f470fca14e00f80ea36/watchdog-6.0.0-py3-none-manylinux2014_aarch64.whl", hash = "sha256:7607498efa04a3542ae3e05e64da8202e58159aa1fa4acddf7678d34a35d4f13", size = 79079, upload-time = "2024-11-01T14:06:59.472Z" }, + { url = "https://files.pythonhosted.org/packages/5c/51/d46dc9332f9a647593c947b4b88e2381c8dfc0942d15b8edc0310fa4abb1/watchdog-6.0.0-py3-none-manylinux2014_armv7l.whl", hash = "sha256:9041567ee8953024c83343288ccc458fd0a2d811d6a0fd68c4c22609e3490379", size = 79078, upload-time = "2024-11-01T14:07:01.431Z" }, + { url = 
"https://files.pythonhosted.org/packages/d4/57/04edbf5e169cd318d5f07b4766fee38e825d64b6913ca157ca32d1a42267/watchdog-6.0.0-py3-none-manylinux2014_i686.whl", hash = "sha256:82dc3e3143c7e38ec49d61af98d6558288c415eac98486a5c581726e0737c00e", size = 79076, upload-time = "2024-11-01T14:07:02.568Z" }, + { url = "https://files.pythonhosted.org/packages/ab/cc/da8422b300e13cb187d2203f20b9253e91058aaf7db65b74142013478e66/watchdog-6.0.0-py3-none-manylinux2014_ppc64.whl", hash = "sha256:212ac9b8bf1161dc91bd09c048048a95ca3a4c4f5e5d4a7d1b1a7d5752a7f96f", size = 79077, upload-time = "2024-11-01T14:07:03.893Z" }, + { url = "https://files.pythonhosted.org/packages/2c/3b/b8964e04ae1a025c44ba8e4291f86e97fac443bca31de8bd98d3263d2fcf/watchdog-6.0.0-py3-none-manylinux2014_ppc64le.whl", hash = "sha256:e3df4cbb9a450c6d49318f6d14f4bbc80d763fa587ba46ec86f99f9e6876bb26", size = 79078, upload-time = "2024-11-01T14:07:05.189Z" }, + { url = "https://files.pythonhosted.org/packages/62/ae/a696eb424bedff7407801c257d4b1afda455fe40821a2be430e173660e81/watchdog-6.0.0-py3-none-manylinux2014_s390x.whl", hash = "sha256:2cce7cfc2008eb51feb6aab51251fd79b85d9894e98ba847408f662b3395ca3c", size = 79077, upload-time = "2024-11-01T14:07:06.376Z" }, + { url = "https://files.pythonhosted.org/packages/b5/e8/dbf020b4d98251a9860752a094d09a65e1b436ad181faf929983f697048f/watchdog-6.0.0-py3-none-manylinux2014_x86_64.whl", hash = "sha256:20ffe5b202af80ab4266dcd3e91aae72bf2da48c0d33bdb15c66658e685e94e2", size = 79078, upload-time = "2024-11-01T14:07:07.547Z" }, + { url = "https://files.pythonhosted.org/packages/07/f6/d0e5b343768e8bcb4cda79f0f2f55051bf26177ecd5651f84c07567461cf/watchdog-6.0.0-py3-none-win32.whl", hash = "sha256:07df1fdd701c5d4c8e55ef6cf55b8f0120fe1aef7ef39a1c6fc6bc2e606d517a", size = 79065, upload-time = "2024-11-01T14:07:09.525Z" }, + { url = "https://files.pythonhosted.org/packages/db/d9/c495884c6e548fce18a8f40568ff120bc3a4b7b99813081c8ac0c936fa64/watchdog-6.0.0-py3-none-win_amd64.whl", hash = 
"sha256:cbafb470cf848d93b5d013e2ecb245d4aa1c8fd0504e863ccefa32445359d680", size = 79070, upload-time = "2024-11-01T14:07:10.686Z" }, + { url = "https://files.pythonhosted.org/packages/33/e8/e40370e6d74ddba47f002a32919d91310d6074130fe4e17dabcafc15cbf1/watchdog-6.0.0-py3-none-win_ia64.whl", hash = "sha256:a1914259fa9e1454315171103c6a30961236f508b9b623eae470268bbcc6a22f", size = 79067, upload-time = "2024-11-01T14:07:11.845Z" }, ] [[package]]