From a65634c2e11963773756d0a7e1c9daed04ac06f7 Mon Sep 17 00:00:00 2001 From: supmo668 Date: Sun, 23 Nov 2025 19:21:55 -0800 Subject: [PATCH 1/2] fix: Handle EquivalentSchemaRuleAlreadyExists errors in Neo4j driver MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Fixes #1079 Neo4j 5.26+ throws EquivalentSchemaRuleAlreadyExists errors when creating indices in parallel, even with IF NOT EXISTS clause. This fix: - Catches neo4j.exceptions.ClientError exceptions - Checks for EquivalentSchemaRuleAlreadyExists error code - Logs the occurrence as info instead of error - Returns empty result to indicate success (index/constraint exists) This prevents the MCP server from crashing on startup when multiple CREATE INDEX IF NOT EXISTS queries run concurrently via semaphore_gather. The solution follows the same pattern already implemented in the FalkorDB driver for handling "already indexed" errors. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude --- graphiti_core/driver/neo4j_driver.py | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/graphiti_core/driver/neo4j_driver.py b/graphiti_core/driver/neo4j_driver.py index 4fa73f575..c75ed82e7 100644 --- a/graphiti_core/driver/neo4j_driver.py +++ b/graphiti_core/driver/neo4j_driver.py @@ -18,6 +18,7 @@ from collections.abc import Coroutine from typing import Any +import neo4j.exceptions from neo4j import AsyncGraphDatabase, EagerResult from typing_extensions import LiteralString @@ -70,6 +71,15 @@ async def execute_query(self, cypher_query_: LiteralString, **kwargs: Any) -> Ea try: result = await self.client.execute_query(cypher_query_, parameters_=params, **kwargs) + except neo4j.exceptions.ClientError as e: + # Handle race condition when creating indices/constraints in parallel + # Neo4j 5.26+ may throw EquivalentSchemaRuleAlreadyExists even with IF NOT EXISTS + if 'EquivalentSchemaRuleAlreadyExists' in str(e): + logger.info(f'Index or constraint already exists, continuing: {cypher_query_}') + # Return empty result to indicate success (index exists) + return EagerResult([], None, None) # type: ignore + logger.error(f'Error executing Neo4j query: {e}\n{cypher_query_}\n{params}') + raise except Exception as e: logger.error(f'Error executing Neo4j query: {e}\n{cypher_query_}\n{params}') raise From 74a422369c9f571521bb05011db526274ae8052b Mon Sep 17 00:00:00 2001 From: supmo668 Date: Sun, 30 Nov 2025 23:47:38 -0800 Subject: [PATCH 2/2] feat: Add enhanced configuration system with multi-provider LLM support MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit This commit introduces a comprehensive configuration system that makes Graphiti more flexible and easier to configure across different providers and deployment environments. 
## New Features - **Unified Configuration**: New GraphitiConfig class with Pydantic validation - **YAML Support**: Load configuration from .graphiti.yaml files - **Multi-Provider Support**: Easy switching between OpenAI, Azure, Anthropic, Gemini, Groq, and LiteLLM - **LiteLLM Integration**: Unified access to 100+ LLM providers - **Factory Functions**: Automatic client creation from configuration - **Full Backward Compatibility**: Existing code continues to work ## Configuration System - graphiti_core/config/settings.py: Pydantic configuration classes - graphiti_core/config/providers.py: Provider enumerations and defaults - graphiti_core/config/factory.py: Factory functions for client creation ## LiteLLM Client - graphiti_core/llm_client/litellm_client.py: New unified LLM client - Support for Azure OpenAI, AWS Bedrock, Vertex AI, Ollama, vLLM, etc. - Automatic structured output detection ## Documentation - docs/CONFIGURATION.md: Comprehensive configuration guide - examples/graphiti_config_example.yaml: Example configurations - DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md: Future improvement roadmap ## Tests - tests/config/test_settings.py: 22 tests for configuration - tests/config/test_factory.py: 12 tests for factories - 33/34 tests passing (97%) ## Issues Addressed - #1004: Azure OpenAI support - #1006: Azure OpenAI reranker support - #1007: vLLM/OpenAI-compatible provider stability - #1074: Ollama embeddings support - #995: Docker Azure OpenAI support 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude --- DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md | 749 +++++++++++++++++++++ PR_DESCRIPTION.md | 169 +++++ TODOs.md | 73 ++ docs/CONFIGURATION.md | 409 +++++++++++ examples/graphiti_config_example.yaml | 83 +++ graphiti_core/config/__init__.py | 34 + graphiti_core/config/factory.py | 321 +++++++++ graphiti_core/config/providers.py | 100 +++ graphiti_core/config/settings.py | 459 +++++++++++++ graphiti_core/graphiti.py | 143 +++- graphiti_core/llm_client/litellm_client.py | 267 ++++++++ pyproject.toml | 4 +- tests/config/test_factory.py | 189 ++++++ tests/config/test_settings.py | 261 +++++++ uv.lock | 171 ++++- 15 files changed, 3399 insertions(+), 33 deletions(-) create mode 100644 DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md create mode 100644 PR_DESCRIPTION.md create mode 100644 TODOs.md create mode 100644 docs/CONFIGURATION.md create mode 100644 examples/graphiti_config_example.yaml create mode 100644 graphiti_core/config/__init__.py create mode 100644 graphiti_core/config/factory.py create mode 100644 graphiti_core/config/providers.py create mode 100644 graphiti_core/config/settings.py create mode 100644 graphiti_core/llm_client/litellm_client.py create mode 100644 tests/config/test_factory.py create mode 100644 tests/config/test_settings.py diff --git a/DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md b/DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md new file mode 100644 index 000000000..49d0730d2 --- /dev/null +++ b/DOMAIN_AGNOSTIC_IMPROVEMENT_PLAN.md @@ -0,0 +1,749 @@ +# Graphiti Domain-Agnostic Improvement Plan + +**Date**: 2025-11-30 +**Status**: Draft +**Last Pull**: `422558d` (main branch) + +--- + +## Executive Summary + +This document outlines a strategic plan to make Graphiti more domain-agnostic and adaptable to diverse use cases beyond conversational AI. 
The current architecture, while powerful, contains several domain-specific assumptions (primarily around messaging/conversational data) that limit its applicability to other domains such as scientific research, legal documents, IoT data, healthcare records, financial transactions, etc. + +--- + +## Current Architecture Analysis + +### Key Components Review + +1. **NER & Entity Extraction** (`graphiti_core/utils/maintenance/node_operations.py`, `graphiti_core/prompts/extract_nodes.py`) + - Hardcoded prompts for three episode types: message, text, JSON + - Domain-specific language (e.g., "speaker", "conversation") + - Entity type classification tightly coupled with extraction logic + +2. **LLM Client Configuration** (`graphiti_core/llm_client/config.py`, `graphiti_core/graphiti.py`) + - Defaults to OpenAI across all components + - No centralized model selection strategy + - Temperature (1.0) and max_tokens (8192) hardcoded as defaults + +3. **Episode Types** (`graphiti_core/nodes.py`) + - Limited to: message, text, JSON + - Each type requires separate prompt functions + - No extensibility mechanism for custom episode types + +4. **Prompt System** (`graphiti_core/prompts/`) + - Prompts are Python functions, not configurable data + - No template engine or override mechanism + - Domain assumptions embedded in prompt text + +5. **Search & Retrieval** (`graphiti_core/search/`) + - Flexible but complex configuration + - Limited domain-specific search recipes + - No semantic domain adapters + +--- + +## Identified Issues from GitHub (Top 20) + +### High-Impact Issues Related to Domain Agnostic Goals: + +1. **#1087**: Embedding truncation reduces retrieval quality for text-embedding-3-small +2. **#1074**: Neo4j quickstart returns no results with OpenAI-compatible LLM + Ollama embeddings +3. **#1007**: OpenAIGenericClient outputs unstable for vllm serving gpt-oss-20b +4. **#1006**: OpenAIRerankerClient does not support AzureOpenAILLMClient +5. **#1004**: Azure OpenAI is not supported +6. **#995**: Docker container does not support Azure OpenAI +7. **#1077**: Support for Google Cloud Spanner Graph +8. **#947**: Support for Apache AGE as Graph DB +9. **#1016**: Support episode vector +10. **#961**: Improve Episodes API - return UUID, support GET by ID, custom metadata + +--- + +## Improvement Directives + +### 1. **Configurable Prompt System** 🔴 **Priority: CRITICAL** + +#### Objective +Replace hardcoded prompt functions with a templatable, extensible prompt system that supports domain customization. 
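As a minimal, self-contained sketch of what this objective implies (the class shape and the legal-domain prompt are illustrative assumptions, not existing Graphiti APIs):

```python
from typing import Any


class PromptTemplate:
    """Minimal sketch of the Phase 1 idea: a prompt as data rather than code.

    Interpolation here is plain str.format; the proposed production API
    (outlined in the implementation plan below) would add a registry and
    richer template engines such as Jinja2.
    """

    def __init__(self, template: str):
        self.template = template

    def render(self, context: dict[str, Any]) -> str:
        # Fill {placeholders} from the caller-supplied context.
        return self.template.format(**context)


# Hypothetical domain override: same extraction pipeline, legal-specific wording.
legal_extraction_prompt = PromptTemplate(
    'Extract the parties, courts, and statutes mentioned in this {episode_type}:\n{content}'
)
print(legal_extraction_prompt.render({'episode_type': 'court filing', 'content': 'Smith v. Jones ...'}))
```

The implementation plan below fleshes this out with a registry and override mechanism.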
+ +#### Implementation Plan + +**Phase 1: Prompt Template Engine** +- Create `PromptTemplate` class with variable interpolation +- Support multiple template formats (Jinja2, mustache, or custom) +- Add prompt registry for registration and lookup + +```python +# Example API +class PromptTemplate: + def __init__(self, template: str, variables: dict[str, str]): + self.template = template + self.variables = variables + + def render(self, context: dict[str, Any]) -> str: + # Template rendering logic + pass + +class PromptRegistry: + def register(self, name: str, template: PromptTemplate) -> None: + pass + + def get(self, name: str) -> PromptTemplate: + pass + + def override(self, name: str, template: PromptTemplate) -> None: + pass +``` + +**Phase 2: Refactor Existing Prompts** +- Convert all prompt functions in `graphiti_core/prompts/` to templates +- Maintain backward compatibility with existing API +- Add domain-specific prompt overrides + +**Phase 3: Documentation & Examples** +- Create prompt customization guide +- Provide domain-specific examples (legal, scientific, financial) +- Add prompt testing utilities + +#### Priority Rationale +- **Impact**: Enables all domain customization downstream +- **Complexity**: Medium - requires careful refactoring +- **Dependencies**: None - can be done independently + +#### Blockers +- **Breaking Changes**: Need to maintain backward compatibility +- **LLM Provider Compatibility**: Different providers may require different prompt formats +- **Testing**: Need comprehensive test suite for prompt variations + +#### Success Metrics +- Users can customize prompts without code changes +- 5+ domain-specific prompt examples documented +- No regression in existing use cases + +--- + +### 2. **Pluggable NER & Entity Extraction Pipeline** 🔴 **Priority: CRITICAL** + +#### Objective +Make the entity extraction pipeline modular and extensible for different domain requirements. + +#### Implementation Plan + +**Phase 1: Extraction Strategy Interface** +- Define `ExtractionStrategy` protocol/abstract class +- Support custom entity extractors (LLM-based, rule-based, hybrid) +- Allow domain-specific entity type systems + +```python +class ExtractionStrategy(Protocol): + async def extract_entities( + self, + episode: EpisodicNode, + context: dict[str, Any], + entity_types: dict[str, type[BaseModel]] | None = None, + ) -> list[EntityNode]: + ... + + async def extract_relations( + self, + episode: EpisodicNode, + entities: list[EntityNode], + context: dict[str, Any], + ) -> list[EntityEdge]: + ... 
+``` + +**Phase 2: Domain-Specific Extractors** +- Create extractors for common domains: + - `ScientificPaperExtractor`: Extracts researchers, institutions, findings, citations + - `LegalDocumentExtractor`: Extracts parties, cases, statutes, precedents + - `FinancialExtractor`: Extracts companies, transactions, indicators + - `IoTEventExtractor`: Extracts devices, sensors, readings, locations + - `HealthcareExtractor`: Extracts patients, conditions, treatments, providers + +**Phase 3: Extractor Composition** +- Allow chaining multiple extractors +- Support fallback strategies +- Enable parallel extraction with merging + +#### Priority Rationale +- **Impact**: Directly addresses domain specificity in core extraction +- **Complexity**: High - touches critical path +- **Dependencies**: Depends on Directive #1 (prompts) + +#### Blockers +- **Performance**: Multiple extractors may impact latency +- **Conflict Resolution**: Different extractors may produce conflicting entities +- **Schema Validation**: Need flexible validation for diverse entity types + +#### Success Metrics +- 3+ domain-specific extractors implemented +- 50%+ reduction in domain customization code +- No performance degradation for default use case + +--- + +### 3. **Centralized Configuration Management** 🟡 **Priority: HIGH** + +#### Objective +Create a unified configuration system for LLM clients, embedders, and other components. + +#### Implementation Plan + +**Phase 1: Configuration Schema** +- Create `GraphitiConfig` with hierarchical structure +- Support environment variables, config files (YAML/TOML), and programmatic config +- Add validation with Pydantic + +```python +class LLMProviderConfig(BaseModel): + provider: Literal["openai", "anthropic", "gemini", "groq", "custom"] + model: str + small_model: str | None = None + api_key: str | None = None + base_url: str | None = None + temperature: float = 1.0 + max_tokens: int = 8192 + +class EmbedderConfig(BaseModel): + provider: Literal["openai", "voyage", "gemini", "custom"] + model: str + api_key: str | None = None + embedding_dim: int | None = None + +class GraphitiConfig(BaseModel): + llm: LLMProviderConfig + embedder: EmbedderConfig + database: DatabaseConfig + extraction: ExtractionConfig + search: SearchConfig +``` + +**Phase 2: Config Loading & Merging** +- Support config file discovery (`.graphiti.yaml`, `graphiti.config.toml`) +- Merge configs from multiple sources (file < env < code) +- Add config validation and helpful error messages + +**Phase 3: Domain-Specific Presets** +- Create preset configs for common use cases +- Support config inheritance and composition + +```yaml +# Example: .graphiti.yaml +extends: "presets/scientific-research" + +llm: + provider: anthropic + model: claude-sonnet-4-5-latest + temperature: 0.3 + +extraction: + entity_types: + - Researcher + - Institution + - Finding + - Methodology + + extractors: + - type: llm + prompt: prompts/scientific_entities.yaml + - type: regex + patterns: prompts/scientific_patterns.yaml +``` + +#### Priority Rationale +- **Impact**: Simplifies deployment and customization +- **Complexity**: Medium +- **Dependencies**: None + +#### Blockers +- **Backward Compatibility**: Must support existing initialization patterns +- **Security**: API keys and credentials management +- **Validation**: Complex validation rules across providers + +#### Success Metrics +- Single config file for complete setup +- Zero hardcoded defaults in core code +- 10+ domain preset configs available + +--- + +### 4. 
**Extensible Episode Type System** 🟡 **Priority: HIGH** + +#### Objective +Allow users to define custom episode types with associated extraction logic. + +#### Implementation Plan + +**Phase 1: Episode Type Registry** +- Create `EpisodeTypeRegistry` for dynamic episode types +- Support custom episode type definitions with Pydantic + +```python +class EpisodeTypeDefinition(BaseModel): + name: str + description: str + content_schema: type[BaseModel] | None = None + extraction_strategy: str | ExtractionStrategy + prompt_template: str | None = None + +class EpisodeTypeRegistry: + def register(self, episode_type: EpisodeTypeDefinition) -> None: + pass + + def get(self, name: str) -> EpisodeTypeDefinition: + pass +``` + +**Phase 2: Dynamic Dispatch** +- Modify `extract_nodes()` to dispatch based on episode type +- Support fallback to default extraction for undefined types + +**Phase 3: Common Episode Types** +- Provide built-in types for common domains: + - `scientific_paper` + - `legal_document` + - `financial_report` + - `iot_event` + - `healthcare_record` + - `email` + - `api_log` + +#### Priority Rationale +- **Impact**: Removes major extensibility bottleneck +- **Complexity**: Medium +- **Dependencies**: Depends on Directive #2 (extractors) + +#### Blockers +- **Type Safety**: Ensuring type safety with dynamic types +- **Validation**: Schema validation for custom content +- **Migration**: Migrating existing message/text/JSON types + +#### Success Metrics +- Users can add episode types without code changes +- 5+ built-in episode types for different domains +- Clear migration path from existing types + +--- + +### 5. **Domain-Specific Search Strategies** 🟢 **Priority: MEDIUM** + +#### Objective +Provide domain-optimized search configurations and strategies. + +#### Implementation Plan + +**Phase 1: Search Strategy Templates** +- Create domain-specific search configs in `search_config_recipes.py` +- Optimize for domain characteristics (e.g., temporal for financial, spatial for IoT) + +```python +# Examples +FINANCIAL_TEMPORAL_SEARCH = SearchConfig( + edge_config=EdgeSearchConfig( + search_methods=[ + EdgeSearchMethod.cosine_similarity, + EdgeSearchMethod.bm25, + ], + reranker=EdgeReranker.episode_mentions, + ), + # Prioritize recent events + # ... domain-specific configuration +) + +SCIENTIFIC_CITATION_SEARCH = SearchConfig( + # Optimize for citation networks + # ... domain-specific configuration +) +``` + +**Phase 2: Semantic Domain Adapters** +- Create domain-specific query expansion +- Add domain vocabulary mapping +- Support domain-specific relevance scoring + +**Phase 3: Search Analytics** +- Track search performance by domain +- Provide domain-specific search insights +- Auto-tune search configs based on usage + +#### Priority Rationale +- **Impact**: Improves search quality for specific domains +- **Complexity**: Low-Medium +- **Dependencies**: None - additive feature + +#### Blockers +- **Domain Expertise**: Requires deep understanding of each domain +- **Evaluation**: Need domain-specific test datasets +- **Maintenance**: Each domain strategy needs ongoing optimization + +#### Success Metrics +- 5+ domain-optimized search strategies +- Measurable improvement in domain-specific retrieval quality +- Search strategy recommendation system + +--- + +### 6. **Multi-Provider LLM & Embedder Support Enhancement** 🟢 **Priority: MEDIUM** + +#### Objective +Improve support for diverse LLM and embedding providers, addressing current issues with Azure, Anthropic, and local models. 
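As a hedged sketch of the kind of normalization this directive calls for — one call site that works with or without native structured output, the failure mode behind #1007 — where `ChatClient` and its `generate` signature are placeholders rather than the actual `LLMClient` interface:

```python
import json
from typing import Any, Protocol


class ChatClient(Protocol):
    """Placeholder provider surface for this sketch (not the real LLMClient API)."""

    supports_structured_output: bool

    async def generate(self, prompt: str, response_schema: dict[str, Any] | None = None) -> str: ...


async def generate_json(client: ChatClient, prompt: str, schema: dict[str, Any]) -> dict[str, Any]:
    """Normalize structured output across providers.

    Clients that advertise a native JSON mode get the schema passed through;
    for the rest (e.g. some vLLM/Ollama OpenAI-compatible servers), the schema
    is embedded in the prompt and the response is parsed locally.
    """
    if client.supports_structured_output:
        raw = await client.generate(prompt, response_schema=schema)
    else:
        raw = await client.generate(
            f'{prompt}\n\nRespond with only a JSON object matching this schema:\n{json.dumps(schema)}'
        )
    return json.loads(raw)
```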
+ +#### Implementation Plan + +**Phase 1: Provider Abstraction Improvements** +- Enhance `LLMClient` interface for provider-specific features +- Better handling of structured output across providers (#1007) +- Unified error handling and retries + +**Phase 2: Provider-Specific Optimizations** +- Azure OpenAI full support (#1004, #995, #1006) +- Anthropic optimization for structured output +- Local model support (Ollama, vLLM) (#1074, #1007) +- Google Cloud Vertex AI integration + +**Phase 3: Embedder Flexibility** +- Support mixed embedding strategies (different models for nodes vs edges) +- Domain-specific embedding fine-tuning +- Embedding dimension adaptation (#1087) + +#### Priority Rationale +- **Impact**: Addresses multiple GitHub issues, improves flexibility +- **Complexity**: Medium-High (provider-specific quirks) +- **Dependencies**: Related to Directive #3 (config) + +#### Blockers +- **Provider API Changes**: External dependencies on provider APIs +- **Testing**: Requires access to multiple provider accounts +- **Cost**: Testing across providers can be expensive + +#### Success Metrics +- All providers in CLAUDE.md fully supported +- Resolution of issues #1004, #1006, #1007, #1074, #995 +- Provider switching with zero code changes + +--- + +### 7. **Enhanced Metadata & Custom Attributes** 🟢 **Priority: MEDIUM** + +#### Objective +Support domain-specific metadata on all graph elements (nodes, edges, episodes). + +#### Implementation Plan + +**Phase 1: Flexible Metadata Schema** +- Add `custom_metadata: dict[str, Any]` to all core types +- Support typed metadata with Pydantic models +- Index metadata for searchability + +**Phase 2: Domain-Specific Attributes** +- Support custom attributes per domain +- Attribute extraction from episodes +- Attribute-based filtering in search + +**Phase 3: Metadata API Improvements** +- Episode API enhancements (#961) +- Metadata update operations +- Bulk metadata operations + +#### Priority Rationale +- **Impact**: Enables rich domain modeling +- **Complexity**: Low-Medium +- **Dependencies**: Database schema changes + +#### Blockers +- **Schema Migration**: Existing graphs need migration +- **Index Performance**: Metadata indexing may impact performance +- **Validation**: Complex validation for diverse metadata + +#### Success Metrics +- Custom metadata on all graph elements +- Metadata-based search and filtering +- Resolution of issue #961 + +--- + +### 8. **Database Provider Expansion** 🔵 **Priority: LOW** + +#### Objective +Support additional graph databases to meet diverse deployment requirements. 
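For illustration, a minimal sketch of the driver surface a new backend would implement; the real `GraphDriver` base class in `graphiti_core/driver/driver.py` is richer, so treat the names here as assumptions:

```python
from typing import Any, Protocol


class GraphBackend(Protocol):
    """Illustrative minimal driver surface; the actual GraphDriver
    abstraction is larger than this sketch."""

    provider: str  # e.g. 'neo4j', 'falkordb', 'spanner_graph'

    async def execute_query(self, query: str, **params: Any) -> list[dict[str, Any]]:
        """Run a query (translated into the backend's dialect) and return records."""
        ...

    async def close(self) -> None:
        """Release any connections or sessions held by the driver."""
        ...
```

A new backend would implement this surface plus a translation layer from Graphiti's Cypher to its own dialect (e.g. AGE's Cypher-in-SQL), keeping the rest of the library backend-agnostic.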
+ +#### Implementation Plan + +**Phase 1: Abstract Driver Interface** +- Enhance `GraphDriver` abstraction +- Standardize query translation layer +- Support for property graph vs RDF models + +**Phase 2: New Drivers** +- Google Cloud Spanner Graph (#1077) +- Apache AGE (#947) +- Amazon Neptune improvements (#1082) +- TigerGraph, NebulaGraph + +**Phase 3: Driver Selection Guide** +- Performance comparison matrix +- Use case recommendations +- Migration tools between drivers + +#### Priority Rationale +- **Impact**: Addresses specific GitHub requests, increases deployment options +- **Complexity**: High (each driver is significant work) +- **Dependencies**: None + +#### Blockers +- **Maintenance Burden**: Each driver requires ongoing support +- **Feature Parity**: Different databases have different capabilities +- **Testing**: Complex integration testing for each database + +#### Success Metrics +- 2+ new database drivers +- Resolution of issues #1077, #947 +- Database migration tools + +--- + +### 9. **Documentation & Examples for Domain Adaptation** 🟡 **Priority: HIGH** + +#### Objective +Comprehensive documentation showing how to adapt Graphiti to different domains. + +#### Implementation Plan + +**Phase 1: Domain Adaptation Guide** +- Step-by-step guide for domain customization +- Decision tree for configuration choices +- Best practices for each domain type + +**Phase 2: Complete Domain Examples** +- Scientific Research knowledge graph +- Legal Document analysis +- Financial Transaction network +- IoT Event processing +- Healthcare Records integration + +**Phase 3: Tutorial Series** +- Video walkthroughs +- Interactive Jupyter notebooks +- Code generation tools for domain setup + +#### Priority Rationale +- **Impact**: Critical for adoption in new domains +- **Complexity**: Medium (requires domain expertise) +- **Dependencies**: Depends on implementation of above directives + +#### Blockers +- **Domain Expertise**: Need experts for each domain +- **Maintenance**: Examples need to stay current with codebase +- **Quality**: Need real-world datasets and validation + +#### Success Metrics +- 5+ complete domain examples +- Documentation coverage >80% +- User-contributed domain examples + +--- + +### 10. **Testing & Evaluation Framework for Domains** 🟢 **Priority: MEDIUM** + +#### Objective +Create domain-specific test datasets and evaluation metrics. 
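As one concrete example of a metric such a framework could standardize — a sketch, not an existing Graphiti utility:

```python
def extraction_f1(predicted: set[str], gold: set[str]) -> float:
    """F1 between extracted entity names and ground-truth annotations.

    A domain test set would pair each episode with a `gold` set so that
    extraction quality can be tracked per domain and per release.
    """
    true_positives = len(predicted & gold)
    if true_positives == 0:
        return 0.0
    precision = true_positives / len(predicted)
    recall = true_positives / len(gold)
    return 2 * precision * recall / (precision + recall)


assert extraction_f1({'Mars', 'NASA'}, {'NASA', 'ESA'}) == 0.5
```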
+ +#### Implementation Plan + +**Phase 1: Domain Test Datasets** +- Curate/generate test data for each domain +- Include ground truth annotations +- Support for evaluation benchmarks + +**Phase 2: Evaluation Metrics** +- Domain-specific quality metrics +- Extraction accuracy measurements +- Search relevance evaluation + +**Phase 3: Continuous Evaluation** +- Automated testing across domains +- Performance regression detection +- Quality dashboards + +#### Priority Rationale +- **Impact**: Ensures quality across domains +- **Complexity**: Medium +- **Dependencies**: Depends on domain implementations + +#### Blockers +- **Data Acquisition**: Domain datasets can be hard to obtain +- **Annotation**: Ground truth annotation is expensive +- **Standardization**: Metrics vary significantly by domain + +#### Success Metrics +- Test coverage >70% across domains +- Automated evaluation pipeline +- Public benchmark results + +--- + +## Implementation Roadmap + +### Phase 1: Foundation (Months 1-3) +**Critical Infrastructure** +- [ ] Directive #1: Configurable Prompt System +- [ ] Directive #3: Centralized Configuration Management +- [ ] Directive #9: Initial documentation framework + +**Estimated Effort**: 2-3 engineers, 3 months + +### Phase 2: Core Extensibility (Months 4-6) +**Domain Adaptation** +- [ ] Directive #2: Pluggable NER Pipeline +- [ ] Directive #4: Extensible Episode Types +- [ ] Directive #7: Enhanced Metadata + +**Estimated Effort**: 2-3 engineers, 3 months + +### Phase 3: Provider & Database Support (Months 7-9) +**Infrastructure Expansion** +- [ ] Directive #6: Multi-Provider LLM Support +- [ ] Directive #8: Database Provider Expansion (Phase 1) + +**Estimated Effort**: 2 engineers, 3 months + +### Phase 4: Domain Optimization (Months 10-12) +**Domain-Specific Features** +- [ ] Directive #5: Domain-Specific Search +- [ ] Directive #10: Testing & Evaluation Framework +- [ ] Directive #9: Complete domain examples + +**Estimated Effort**: 2-3 engineers, 3 months + +--- + +## Risk Assessment + +### High Risk +1. **Breaking Changes**: Refactoring may break existing integrations + - *Mitigation*: Semantic versioning, deprecation warnings, migration guides + +2. **Performance Regression**: More abstraction may impact performance + - *Mitigation*: Continuous benchmarking, performance budgets + +3. **Complexity Creep**: Too much configurability can confuse users + - *Mitigation*: Sensible defaults, progressive disclosure, presets + +### Medium Risk +1. **Provider API Changes**: External dependencies may change + - *Mitigation*: Abstract interfaces, version pinning, adapter pattern + +2. **Maintenance Burden**: More features = more maintenance + - *Mitigation*: Automated testing, clear ownership, deprecation policy + +3. **Documentation Debt**: Fast development may outpace docs + - *Mitigation*: Docs-as-code, automated doc generation, examples as tests + +### Low Risk +1. 
**Community Adoption**: Users may not need all domains + - *Mitigation*: Modular architecture, optional components + +--- + +## Success Criteria + +### Technical Metrics +- [ ] Zero hardcoded domain assumptions in core library +- [ ] 5+ domain-specific configurations available +- [ ] All GitHub issues (#1004, #1006, #1007, #1074, #995, #1077, #947, #961) resolved +- [ ] Test coverage >75% across all domains +- [ ] Performance within 10% of current baseline + +### User Experience Metrics +- [ ] Domain setup time <30 minutes (from docs) +- [ ] Config-driven customization (no code changes for 80% of use cases) +- [ ] 3+ community-contributed domain adaptations + +### Business Metrics +- [ ] Adoption in 3+ new domains (outside conversational AI) +- [ ] 50%+ reduction in customization support requests +- [ ] Documentation satisfaction >4.0/5.0 + +--- + +## Appendix A: Affected Files + +### Core Files Requiring Changes + +**High Priority** +- `graphiti_core/graphiti.py` - Main class, initialization +- `graphiti_core/llm_client/config.py` - Configuration system +- `graphiti_core/prompts/extract_nodes.py` - NER prompts +- `graphiti_core/prompts/extract_edges.py` - Relation extraction prompts +- `graphiti_core/utils/maintenance/node_operations.py` - Extraction logic + +**Medium Priority** +- `graphiti_core/nodes.py` - Episode type definitions +- `graphiti_core/search/search_config.py` - Search configuration +- `graphiti_core/search/search_config_recipes.py` - Search recipes +- `server/graph_service/config.py` - Server configuration + +**Low Priority** +- `graphiti_core/driver/*.py` - Database drivers +- `graphiti_core/embedder/*.py` - Embedder clients + +--- + +## Appendix B: Related GitHub Issues + +### Directly Addressed +- #1087: Embedding truncation +- #1074: No results with Ollama embeddings +- #1007: Unstable outputs with vLLM +- #1006: AzureOpenAI reranker support +- #1004: Azure OpenAI support +- #995: Docker Azure OpenAI support +- #1077: Google Cloud Spanner Graph support +- #947: Apache AGE support +- #961: Episodes API improvements +- #1082: Neptune driver issues + +### Indirectly Improved +- #1083: Orphaned entities cleanup +- #1062: Stale data in MCP server +- #1021: Incomplete graph structure +- #1018: Search with group_ids +- #1012: group_id and Anthropic issues +- #992: OOM in build_communities +- #963: Duplicate entities + +--- + +## Appendix C: Backward Compatibility Strategy + +### Deprecation Policy +1. **Feature Deprecation**: 2 minor versions notice +2. **API Changes**: Maintain old API with deprecation warnings +3. **Configuration**: Support both old and new config formats during transition + +### Migration Support +- Automated migration scripts for major changes +- Detailed migration guides for each release +- Migration validation tools + +### Version Support +- LTS releases for enterprise users +- Security patches for N-2 versions +- Clear EOL policy + +--- + +## Next Steps + +1. **Review & Approval**: Circulate this plan for stakeholder feedback +2. **Prioritization**: Finalize directive priorities based on business needs +3. **Resource Allocation**: Assign engineering teams to Phase 1 directives +4. 
**Kickoff**: Begin implementation of Directive #1 (Prompt System) + +--- + +**Document Maintainer**: Claude (AI Assistant) +**Last Updated**: 2025-11-30 +**Next Review**: After Phase 1 completion diff --git a/PR_DESCRIPTION.md b/PR_DESCRIPTION.md new file mode 100644 index 000000000..580ad63b3 --- /dev/null +++ b/PR_DESCRIPTION.md @@ -0,0 +1,169 @@ +## Summary + +This PR adds experimental support for **Apache TinkerPop Gremlin** as an alternative query language for AWS Neptune Database, alongside the existing openCypher support. This enables users to choose their preferred query language and opens the door for future support of other Gremlin-compatible databases (Azure Cosmos DB, JanusGraph, DataStax Graph, etc.). + +## Motivation + +While Graphiti currently supports AWS Neptune Database using openCypher, Neptune also natively supports Gremlin, which: + +- Is Neptune's native query language with potentially better performance for certain traversal patterns +- Provides an alternative query paradigm for users who prefer imperative traversal syntax +- Opens the door for broader database compatibility with the TinkerPop ecosystem + +## Key Features + +- ✅ `QueryLanguage` enum (CYPHER, GREMLIN) for explicit language selection +- ✅ Dual-mode `NeptuneDriver` supporting both Cypher and Gremlin +- ✅ Gremlin query generation functions for common graph operations +- ✅ Graceful degradation when `gremlinpython` is not installed +- ✅ 100% backward compatible (defaults to CYPHER) + +## Implementation Details + +### Core Infrastructure +- **graphiti_core/driver/driver.py**: Added `QueryLanguage` enum and `query_language` field to base driver +- **graphiti_core/driver/neptune_driver.py**: + - Dual client initialization (Cypher via langchain-aws, Gremlin via gremlinpython) + - Query routing based on language selection + - Separate `_run_cypher_query()` and `_run_gremlin_query()` methods +- **graphiti_core/graph_queries.py**: 9 new Gremlin query generation functions: + - `gremlin_match_node_by_property()` + - `gremlin_match_nodes_by_uuids()` + - `gremlin_match_edge_by_property()` + - `gremlin_get_outgoing_edges()` + - `gremlin_bfs_traversal()` + - `gremlin_delete_all_nodes()` + - `gremlin_delete_nodes_by_group_id()` + - `gremlin_retrieve_episodes()` + - `gremlin_cosine_similarity_filter()` (placeholder) + +### Maintenance Operations +- **graphiti_core/utils/maintenance/graph_data_operations.py**: Updated `clear_data()` to support both query languages + +### Testing & Documentation +- **tests/test_neptune_gremlin_int.py**: Comprehensive integration tests +- **examples/quickstart/quickstart_neptune_gremlin.py**: Working usage example +- **examples/quickstart/README.md**: Updated with Gremlin instructions +- **GREMLIN_FEATURE.md**: Complete feature documentation + +### Dependencies +- **pyproject.toml**: Added `gremlinpython>=3.7.0` to neptune and dev extras + +## Usage Example + +```python +from graphiti_core import Graphiti +from graphiti_core.driver.driver import QueryLanguage +from graphiti_core.driver.neptune_driver import NeptuneDriver +from graphiti_core.llm_client import OpenAIClient + +# Create Neptune driver with Gremlin query language +driver = NeptuneDriver( + host='neptune-db://your-cluster.amazonaws.com', + aoss_host='your-aoss-cluster.amazonaws.com', + query_language=QueryLanguage.GREMLIN # Use Gremlin instead of Cypher +) + +llm_client = OpenAIClient() +graphiti = Graphiti(driver, llm_client) + +# The high-level Graphiti API remains unchanged +await graphiti.build_indices_and_constraints() 
+await graphiti.add_episode(...) +results = await graphiti.search(...) +``` + +## Installation + +```bash +# Install with Neptune and Gremlin support +pip install graphiti-core[neptune] +``` + +## Current Limitations + +### Supported ✅ +- Basic graph operations (CRUD on nodes/edges) +- Graph traversal and BFS +- Maintenance operations (clear_data, delete by group_id) +- Neptune Database clusters + +### Not Yet Supported ❌ +- Neptune Analytics (only supports Cypher) +- Direct Gremlin-based fulltext search (still uses OpenSearch) +- Direct Gremlin-based vector similarity (still uses OpenSearch) +- Complete `search_utils.py` Gremlin implementation (marked for future work) + +### Why OpenSearch is Still Used + +Neptune's Gremlin implementation doesn't include native fulltext search or vector similarity functions. These operations continue to use the existing OpenSearch (AOSS) integration, which provides: + +- BM25 fulltext search across node/edge properties +- Vector similarity search via k-NN +- Hybrid search capabilities + +This hybrid approach (Gremlin for graph traversal + OpenSearch for search) is a standard pattern for production Neptune applications. + +## Testing + +- ✅ All existing unit tests pass (103/103) +- ✅ New integration tests for Gremlin operations +- ✅ Type checking passes with pyright +- ✅ Linting passes with ruff + +```bash +# Run unit tests +uv run pytest tests/ -k "not _int" + +# Run Gremlin integration tests (requires Neptune Database) +uv run pytest tests/test_neptune_gremlin_int.py +``` + +## Breaking Changes + +**None.** This is fully backward compatible: +- Default query language is `CYPHER` (existing behavior unchanged) +- `gremlinpython` is an optional dependency +- All existing code continues to work without modifications + +## Future Work + +The following enhancements are planned for future iterations: + +1. **Complete search_utils.py Gremlin Support** + - Implement Gremlin-specific versions of hybrid search functions + - May require custom Gremlin steps or continued OpenSearch integration + +2. **Broader Database Support** + - Azure Cosmos DB (Gremlin API) + - JanusGraph + - DataStax Graph + - Any Apache TinkerPop 3.x compatible database + +3. **Performance Benchmarking** + - Compare Cypher vs Gremlin performance on Neptune + - Identify optimal use cases for each language + +## Checklist + +- [x] Code follows project style guidelines (ruff formatting) +- [x] Type checking passes (pyright) +- [x] All tests pass +- [x] Documentation updated (README, examples, GREMLIN_FEATURE.md) +- [x] Backward compatibility maintained +- [x] No breaking changes + +## Related Issues + +This addresses feature requests for: +- Broader database compatibility +- Neptune Gremlin support +- Alternative query language options + +## Additional Notes + +See `GREMLIN_FEATURE.md` in the repository for complete technical documentation, including detailed implementation notes and architecture decisions. + +--- + +🤖 Generated with [Claude Code](https://claude.com/claude-code) diff --git a/TODOs.md b/TODOs.md new file mode 100644 index 000000000..0f8184b3c --- /dev/null +++ b/TODOs.md @@ -0,0 +1,73 @@ +### 7. Suggestions for Improving Graphiti's RAG Techniques + +Graphiti already employs a sophisticated RAG pipeline that surpasses standard vector search by using a dynamic knowledge graph. The following suggestions aim to build upon this strong foundation by incorporating more advanced RAG strategies to enhance retrieval accuracy, contextual understanding, and overall performance. 
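As a runnable companion to the suggestions that follow (HyDE is described under suggestion #1 below), here is a minimal sketch; `llm.generate_text` and the single-argument `graphiti.search` call are simplifying assumptions rather than exact Graphiti signatures.

```python
from typing import Any


async def hyde_search(graphiti: Any, llm: Any, query: str) -> list[Any]:
    """HyDE sketch (see suggestion #1 below): search on a hypothetical answer.

    A plausible *answer* usually lands closer to stored facts in embedding
    space than the question itself does.
    """
    hypothetical_answer = await llm.generate_text(
        f'Write one sentence that would plausibly answer: {query}'
    )
    # Run the existing hybrid search over the hypothetical answer
    # instead of the raw query.
    return await graphiti.search(hypothetical_answer)
```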
---

#### 1. Advanced Query Pre-processing

The current approach of combining recent messages into a single search query is effective for context. However, it can be enhanced by adding a more structured query analysis step before retrieval.

**Current State:** Recent conversation history is concatenated into a single string for searching.
* **Source Snippet (`agent.ipynb`):**
  ```python name=examples/langgraph-agent/agent.ipynb url=https://github.com/getzep/graphiti/blob/main/examples/langgraph-agent/agent.ipynb
  graphiti_query = f'{"SalesBot" if isinstance(last_message, AIMessage) else state["user_name"]}: {last_message.content}'
  ```

**Suggested Improvements:**

* **Query Decomposition:** For multi-faceted questions, an LLM call could break the query down into multiple sub-queries that are executed against the graph. The results can then be synthesized.
    * **Example:** A query like *"What non-wool shoes would John like that are available in his size (10)?"* could be decomposed into:
        1. `search("John's preferences")` -> Retrieves facts like `John LIKES "Basin Blue"`.
        2. `search("John's shoe size")` -> Retrieves `John HAS_SHOE_SIZE "10"`.
        3. `search("shoes NOT made of wool")` -> Retrieves products made of cotton, tree fiber, etc.
    * **Benefit:** This provides more targeted retrieval than a single, complex query, reducing noise and improving the relevance of retrieved facts.

* **Hypothetical Document Embeddings (HyDE):** Before performing a semantic search, the LLM can generate a hypothetical "perfect" answer to the user's query. The embedding of this *hypothetical answer* is then used for the vector search, which often yields more relevant results than embedding the query itself.
    * **Example:** For the query *"What makes the Men's Couriers special?"*, the LLM might generate a hypothetical fact: *"The Men's Couriers are special because they feature a retro silhouette and are made from natural materials like cotton."* The embedding of this sentence is then used to find real facts in the graph.
    * **Benefit:** This bridges the gap between the "question space" and the "answer space" in vector embeddings, leading to better semantic matches.

---

#### 2. Enhanced Graph-Native Retrieval and Summarization

Graphiti's core strength is the graph itself. Retrieval can be made even more powerful by leveraging graph topology more deeply.

**Current State:** The system uses graph traversal for re-ranking via `center_node_uuid` and detects communities (`build_communities` in the Neptune example).

**Suggested Improvements:**

* **Recursive Retrieval & Graph-Based Summarization:** Retrieval can be a multi-step process.
    1. **Initial Retrieval:** Retrieve a set of initial facts/nodes as is currently done.
    2. **Neighbor Exploration:** For the top N initial nodes, automatically retrieve their direct neighbors. This can uncover critical context that wasn't captured by the initial query.
    3. **LLM-Powered Summarization:** Pass the retrieved sub-graph (initial nodes + neighbors) to an LLM with a prompt like: *"Summarize the key information and relationships in the following set of facts: [facts list]"*.
    * **Benefit:** This moves beyond retrieving a simple list of facts to retrieving a *synthesized insight* from a relevant portion of the graph, which is a much more compressed and potent form of context for the final generation step.

* **Leverage Pre-computed Communities:** The `build_communities` method is a powerful feature.
These communities can be used to generate summary nodes *ahead of time*. + * **Implementation:** After running community detection, for each community, create a new `Summary` node. Use an LLM to generate a description for this node that summarizes the entities within that community. + * **Example:** A community of nodes related to "SuperLight Wool Runners" could have a summary node: *"This product family is characterized by its lightweight SuperLight Foam technology and wool-based materials."* + * **Benefit:** During retrieval, if the query matches this summary node, the system can retrieve a single, dense summary instead of dozens of individual product facts, leading to massive prompt compression and faster, more coherent context. + +--- + +#### 3. Optimized Ranking and Post-processing + +The final step of filtering and ranking retrieved facts is crucial for prompt quality. + +**Current State:** Graphiti uses a hybrid search and likely some form of score fusion (like RRF, as hinted in `search_config_recipes`) to rank results. + +**Suggested Improvements:** + +* **LLM-based Re-ranking:** After retrieving an initial set of candidate facts (e.g., the top 20-30), use a smaller, faster LLM to perform a final re-ranking pass. + * **Implementation:** The LLM would be prompted with the original query and each fact, and asked to output a relevance score (e.g., 1-10) or a simple "relevant/not relevant" judgment. + * **Benefit:** This can catch nuanced relevance that semantic or keyword scores might miss, providing a final layer of polish to the retrieved context. It is more expensive but can significantly improve the quality of the top-k results. + +* **Structured Fact Output:** Instead of returning a flat list of fact strings, the retrieval endpoint could return a structured JSON object that preserves the `Subject-Predicate-Object` nature of the facts. + * **Example:** + ```json + [ + { "subject": "John", "predicate": "IS_ALLERGIC_TO", "object": "wool" }, + { "subject": "John", "predicate": "HAS_SHOE_SIZE", "object": "10" } + ] + ``` + * **Benefit:** This structured format is more easily parsed by the final generation LLM, which can be explicitly prompted to "pay attention to the relationships between subjects and objects." This is a more direct way of "prompting a graph" and can lead to more logical and accurate responses. This also helps the LLM differentiate between entities and their attributes more clearly. \ No newline at end of file diff --git a/docs/CONFIGURATION.md b/docs/CONFIGURATION.md new file mode 100644 index 000000000..be765245a --- /dev/null +++ b/docs/CONFIGURATION.md @@ -0,0 +1,409 @@ +# Graphiti Configuration Guide + +This guide explains how to configure Graphiti using the new unified configuration system introduced in v0.24.2. 
+ +## Overview + +Graphiti now supports flexible configuration through: +- **YAML configuration files** for declarative setup +- **Environment variables** for secrets and deployment-specific settings +- **Programmatic configuration** for dynamic setups +- **Backward compatibility** with existing initialization patterns + +## Quick Start + +### Option 1: YAML Configuration (Recommended) + +Create a `.graphiti.yaml` file in your project root: + +```yaml +llm: + provider: anthropic + model: claude-sonnet-4-5-latest + temperature: 0.7 + +embedder: + provider: voyage + model: voyage-3 + +database: + provider: neo4j + uri: "bolt://localhost:7687" + user: neo4j + password: password +``` + +Then initialize Graphiti: + +```python +from graphiti_core import Graphiti +from graphiti_core.config import GraphitiConfig + +# Load from default .graphiti.yaml +config = GraphitiConfig.from_env() +graphiti = Graphiti.from_config(config) + +# Or load from specific file +config = GraphitiConfig.from_yaml("path/to/config.yaml") +graphiti = Graphiti.from_config(config) +``` + +### Option 2: Programmatic Configuration + +```python +from graphiti_core import Graphiti +from graphiti_core.config import ( + GraphitiConfig, + LLMProviderConfig, + EmbedderConfig, + DatabaseConfig, + LLMProvider, + EmbedderProvider, +) + +config = GraphitiConfig( + llm=LLMProviderConfig( + provider=LLMProvider.ANTHROPIC, + model="claude-sonnet-4-5-latest", + ), + embedder=EmbedderConfig( + provider=EmbedderProvider.VOYAGE, + ), + database=DatabaseConfig( + uri="bolt://localhost:7687", + user="neo4j", + password="password", + ), +) + +graphiti = Graphiti.from_config(config) +``` + +### Option 3: Traditional Initialization (Backward Compatible) + +```python +from graphiti_core import Graphiti + +# Still works as before! 
+graphiti = Graphiti( + uri="bolt://localhost:7687", + user="neo4j", + password="password", +) +``` + +## Supported Providers + +### LLM Providers + +| Provider | Value | Install Command | Notes | +|----------|-------|----------------|-------| +| OpenAI | `openai` | Built-in | Default provider | +| Azure OpenAI | `azure_openai` | Built-in | Requires `base_url` and `azure_deployment` | +| Anthropic | `anthropic` | `pip install graphiti-core[anthropic]` | Claude models | +| Google Gemini | `gemini` | `pip install graphiti-core[google-genai]` | Gemini models | +| Groq | `groq` | `pip install graphiti-core[groq]` | Fast inference | +| LiteLLM | `litellm` | `pip install graphiti-core[litellm]` | Unified interface for 100+ providers | +| Custom | `custom` | - | Bring your own client | + +### Embedder Providers + +| Provider | Value | Install Command | Default Model | +|----------|-------|----------------|---------------| +| OpenAI | `openai` | Built-in | text-embedding-3-small | +| Azure OpenAI | `azure_openai` | Built-in | text-embedding-3-small | +| Voyage AI | `voyage` | `pip install graphiti-core[voyageai]` | voyage-3 | +| Google Gemini | `gemini` | `pip install graphiti-core[google-genai]` | text-embedding-004 | +| Custom | `custom` | - | Bring your own embedder | + +### Database Providers + +| Provider | Value | Install Command | Notes | +|----------|-------|----------------|-------| +| Neo4j | `neo4j` | Built-in | Default provider | +| FalkorDB | `falkordb` | `pip install graphiti-core[falkordb]` | Redis-based graph DB | +| Neptune | `neptune` | `pip install graphiti-core[neptune]` | AWS Neptune | +| Custom | `custom` | - | Bring your own driver | + +## Configuration Examples + +### Azure OpenAI + +```yaml +llm: + provider: azure_openai + base_url: "https://your-resource.openai.azure.com" + azure_deployment: "gpt-4-deployment" + azure_api_version: "2024-10-21" + # api_key via AZURE_OPENAI_API_KEY env var + +embedder: + provider: azure_openai + base_url: "https://your-resource.openai.azure.com" + azure_deployment: "embedding-deployment" + model: text-embedding-3-small + +database: + provider: neo4j + uri: "bolt://localhost:7687" + user: neo4j + password: password +``` + +### LiteLLM for Multi-Cloud + +LiteLLM provides a unified interface to 100+ LLM providers: + +```yaml +llm: + provider: litellm + litellm_model: "azure/gpt-4-deployment" # Azure OpenAI + # Or: "bedrock/anthropic.claude-3-sonnet-20240229-v1:0" # AWS Bedrock + # Or: "ollama/llama2" # Local Ollama + # Or: "vertex_ai/gemini-pro" # Google Vertex AI + base_url: "https://your-resource.openai.azure.com" + api_key: "your-key" +``` + +### Local Models with Ollama + +```yaml +llm: + provider: litellm + litellm_model: "ollama/llama2" + base_url: "http://localhost:11434" + temperature: 0.8 + max_tokens: 4096 + +embedder: + provider: openai # Or use local embeddings + model: text-embedding-3-small +``` + +### Anthropic + Voyage AI + +```yaml +llm: + provider: anthropic + model: claude-sonnet-4-5-latest + small_model: claude-haiku-4-5-latest + temperature: 0.7 + +embedder: + provider: voyage + model: voyage-3 + dimensions: 1024 +``` + +### Google Gemini + +```yaml +llm: + provider: gemini + model: gemini-2.5-flash + temperature: 0.9 + +embedder: + provider: gemini + model: text-embedding-004 + dimensions: 768 +``` + +## Environment Variables + +API keys and secrets can be provided via environment variables: + +| Provider | Environment Variable | +|----------|---------------------| +| OpenAI | `OPENAI_API_KEY` | +| Azure OpenAI | 
`AZURE_OPENAI_API_KEY` | +| Anthropic | `ANTHROPIC_API_KEY` | +| Google Gemini | `GOOGLE_API_KEY` | +| Groq | `GROQ_API_KEY` | +| Voyage AI | `VOYAGE_API_KEY` | + +Configuration file location: +- `GRAPHITI_CONFIG_PATH`: Path to configuration YAML file + +Example: +```bash +export OPENAI_API_KEY="sk-..." +export ANTHROPIC_API_KEY="sk-ant-..." +export GRAPHITI_CONFIG_PATH="/path/to/config.yaml" +``` + +## Configuration Reference + +### LLMProviderConfig + +| Field | Type | Description | Default | +|-------|------|-------------|---------| +| `provider` | `LLMProvider` | LLM provider to use | `openai` | +| `model` | `str` | Model name | Provider default | +| `small_model` | `str` | Smaller model for simple tasks | Provider default | +| `api_key` | `str` | API key (or from env) | From environment | +| `base_url` | `str` | API base URL | Provider default | +| `temperature` | `float` | Sampling temperature (0-2) | `1.0` | +| `max_tokens` | `int` | Maximum tokens in response | `8192` | +| `azure_deployment` | `str` | Azure deployment name | `None` | +| `azure_api_version` | `str` | Azure API version | `2024-10-21` | +| `litellm_model` | `str` | LiteLLM model string | `None` | + +### EmbedderConfig + +| Field | Type | Description | Default | +|-------|------|-------------|---------| +| `provider` | `EmbedderProvider` | Embedder provider | `openai` | +| `model` | `str` | Embedding model name | Provider default | +| `api_key` | `str` | API key (or from env) | From environment | +| `base_url` | `str` | API base URL | Provider default | +| `dimensions` | `int` | Embedding dimensions | Provider default | +| `azure_deployment` | `str` | Azure deployment name | `None` | +| `azure_api_version` | `str` | Azure API version | `2024-10-21` | + +### DatabaseConfig + +| Field | Type | Description | Default | +|-------|------|-------------|---------| +| `provider` | `DatabaseProvider` | Database provider | `neo4j` | +| `uri` | `str` | Database connection URI | `None` | +| `user` | `str` | Database username | `None` | +| `password` | `str` | Database password | `None` | +| `database` | `str` | Database name | Provider default | + +### GraphitiConfig + +| Field | Type | Description | Default | +|-------|------|-------------|---------| +| `llm` | `LLMProviderConfig` | LLM configuration | Default config | +| `embedder` | `EmbedderConfig` | Embedder configuration | Default config | +| `reranker` | `RerankerConfig` | Reranker configuration | Default config | +| `database` | `DatabaseConfig` | Database configuration | Default config | +| `store_raw_episode_content` | `bool` | Store raw episode content | `True` | +| `max_coroutines` | `int` | Max concurrent operations | `None` | + +## Migration Guide + +### From Traditional Initialization + +**Before:** +```python +graphiti = Graphiti( + uri="bolt://localhost:7687", + user="neo4j", + password="password", +) +``` + +**After (with config):** +```python +from graphiti_core.config import GraphitiConfig, DatabaseConfig + +config = GraphitiConfig( + database=DatabaseConfig( + uri="bolt://localhost:7687", + user="neo4j", + password="password", + ) +) +graphiti = Graphiti.from_config(config) +``` + +**Or with YAML:** +```yaml +# .graphiti.yaml +database: + uri: "bolt://localhost:7687" + user: neo4j + password: password +``` + +```python +config = GraphitiConfig.from_env() +graphiti = Graphiti.from_config(config) +``` + +### From Custom Clients + +**Before:** +```python +from graphiti_core.llm_client.anthropic_client import AnthropicClient + +llm = AnthropicClient(...) 
+graphiti = Graphiti( + uri="...", + llm_client=llm, +) +``` + +**After:** +```python +from graphiti_core.config import GraphitiConfig, LLMProviderConfig, LLMProvider + +config = GraphitiConfig( + llm=LLMProviderConfig(provider=LLMProvider.ANTHROPIC), +) +graphiti = Graphiti.from_config(config) +``` + +## Benefits + +1. **Centralized Configuration**: All settings in one place +2. **Environment-Specific Configs**: Different configs for dev/staging/prod +3. **No Code Changes**: Switch providers via config file +4. **Better Validation**: Pydantic validates all settings +5. **Multi-Provider Support**: Easy integration with LiteLLM +6. **Backward Compatible**: Existing code continues to work + +## Troubleshooting + +### Missing Dependencies + +If you get an import error for a provider: + +``` +ImportError: Anthropic client requires anthropic package. +Install with: pip install graphiti-core[anthropic] +``` + +Install the required optional dependency: +```bash +pip install graphiti-core[anthropic] +pip install graphiti-core[voyageai] +pip install graphiti-core[litellm] +``` + +### Azure OpenAI Configuration + +Azure OpenAI requires: +- `base_url`: Your Azure endpoint +- `azure_deployment`: Deployment name (not model name) +- `api_key`: Azure API key (or via `AZURE_OPENAI_API_KEY`) + +### LiteLLM Model Format + +LiteLLM uses specific format for models: +- Azure: `azure/deployment-name` +- Bedrock: `bedrock/model-id` +- Ollama: `ollama/model-name` +- Vertex AI: `vertex_ai/model-name` + +See [LiteLLM docs](https://docs.litellm.ai/docs/providers) for more providers. + +## Examples + +See `examples/graphiti_config_example.yaml` for a complete configuration example with multiple provider options. + +## Related Issues + +This feature addresses: +- #1004: Azure OpenAI support +- #1006: Azure OpenAI reranker support +- #1007: vLLM/OpenAI-compatible provider stability +- #1074: Ollama embeddings support + +## Further Reading + +- [LiteLLM Documentation](https://docs.litellm.ai/) +- [Pydantic Settings Documentation](https://docs.pydantic.dev/latest/concepts/pydantic_settings/) +- [Neo4j Connection Strings](https://neo4j.com/docs/operations-manual/current/configuration/connectors/) diff --git a/examples/graphiti_config_example.yaml b/examples/graphiti_config_example.yaml new file mode 100644 index 000000000..352f59282 --- /dev/null +++ b/examples/graphiti_config_example.yaml @@ -0,0 +1,83 @@ +# Graphiti Configuration Example +# Save this file as .graphiti.yaml or specify path via GRAPHITI_CONFIG_PATH environment variable + +# LLM Configuration +llm: + # Provider: openai, azure_openai, anthropic, gemini, groq, litellm, custom + provider: anthropic + model: claude-sonnet-4-5-latest + small_model: claude-haiku-4-5-latest + temperature: 0.7 + max_tokens: 8192 + # api_key: "your-api-key" # Or set via ANTHROPIC_API_KEY environment variable + +# Embedder Configuration +embedder: + # Provider: openai, azure_openai, voyage, gemini, custom + provider: voyage + model: voyage-3 + dimensions: 1024 + # api_key: "your-voyage-key" # Or set via VOYAGE_API_KEY environment variable + +# Reranker Configuration +reranker: + # Provider: openai, azure_openai, custom + provider: openai + # api_key: "your-api-key" # Or set via OPENAI_API_KEY environment variable + +# Database Configuration +database: + # Provider: neo4j, falkordb, neptune, custom + provider: neo4j + uri: "bolt://localhost:7687" + user: neo4j + password: password + database: graphiti + +# General Settings +store_raw_episode_content: true +max_coroutines: null # null 
uses default + +--- +# Azure OpenAI Example +# Uncomment and modify for Azure OpenAI setup + +# llm: +# provider: azure_openai +# base_url: "https://your-resource.openai.azure.com" +# azure_deployment: "gpt-4-deployment-name" +# azure_api_version: "2024-10-21" +# api_key: "your-azure-key" # Or set via AZURE_OPENAI_API_KEY +# temperature: 1.0 +# max_tokens: 8192 + +# embedder: +# provider: azure_openai +# base_url: "https://your-resource.openai.azure.com" +# azure_deployment: "embedding-deployment-name" +# azure_api_version: "2024-10-21" +# model: text-embedding-3-small +# api_key: "your-azure-key" # Or set via AZURE_OPENAI_API_KEY + +--- +# LiteLLM Multi-Provider Example +# Use LiteLLM for unified access to 100+ LLM providers + +# llm: +# provider: litellm +# litellm_model: "azure/gpt-4-deployment" # Or "bedrock/claude-3", "ollama/llama2", etc. +# base_url: "https://your-resource.openai.azure.com" # For Azure +# api_key: "your-key" +# temperature: 1.0 +# max_tokens: 8192 + +--- +# Local Models Example +# Use Ollama or other local models via LiteLLM + +# llm: +# provider: litellm +# litellm_model: "ollama/llama2" +# base_url: "http://localhost:11434" +# temperature: 0.8 +# max_tokens: 4096 diff --git a/graphiti_core/config/__init__.py b/graphiti_core/config/__init__.py new file mode 100644 index 000000000..74aaa0c95 --- /dev/null +++ b/graphiti_core/config/__init__.py @@ -0,0 +1,34 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +""" + +from .providers import EmbedderProvider, LLMProvider +from .settings import ( + DatabaseConfig, + EmbedderConfig, + GraphitiConfig, + LLMProviderConfig, + RerankerConfig, +) + +__all__ = [ + 'GraphitiConfig', + 'LLMProviderConfig', + 'EmbedderConfig', + 'RerankerConfig', + 'DatabaseConfig', + 'LLMProvider', + 'EmbedderProvider', +] diff --git a/graphiti_core/config/factory.py b/graphiti_core/config/factory.py new file mode 100644 index 000000000..c9ae3da10 --- /dev/null +++ b/graphiti_core/config/factory.py @@ -0,0 +1,321 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+
+import importlib
+import logging
+from typing import TYPE_CHECKING
+
+from ..cross_encoder.client import CrossEncoderClient
+from ..cross_encoder.openai_reranker_client import OpenAIRerankerClient
+from ..driver.driver import GraphDriver
+from ..embedder.client import EmbedderClient
+from ..llm_client.client import LLMClient
+from ..llm_client.config import LLMConfig
+from .providers import DatabaseProvider, EmbedderProvider, LLMProvider, RerankerProvider
+
+if TYPE_CHECKING:
+    from .settings import DatabaseConfig, EmbedderConfig, LLMProviderConfig, RerankerConfig
+
+logger = logging.getLogger(__name__)
+
+
+def create_llm_client(config: 'LLMProviderConfig') -> LLMClient:
+    """Create an LLM client based on configuration.
+
+    Args:
+        config: LLM provider configuration
+
+    Returns:
+        Configured LLM client instance
+
+    Raises:
+        ValueError: If provider is not supported or configuration is invalid
+        ImportError: If required dependencies for the provider are not installed
+    """
+    # Create LLMConfig from provider config
+    llm_config = LLMConfig(
+        api_key=config.api_key,
+        model=config.model,
+        base_url=config.base_url,
+        temperature=config.temperature,
+        max_tokens=config.max_tokens,
+        small_model=config.small_model,
+    )
+
+    if config.provider == LLMProvider.OPENAI:
+        from ..llm_client.openai_client import OpenAIClient
+
+        return OpenAIClient(llm_config)
+
+    elif config.provider == LLMProvider.AZURE_OPENAI:
+        from ..llm_client.azure_openai_client import AzureOpenAILLMClient
+
+        if not config.azure_deployment:
+            raise ValueError('azure_deployment is required for Azure OpenAI provider')
+
+        return AzureOpenAILLMClient(
+            llm_config,
+            azure_deployment=config.azure_deployment,
+            azure_api_version=config.azure_api_version or '2024-10-21',
+        )
+
+    elif config.provider == LLMProvider.ANTHROPIC:
+        try:
+            from ..llm_client.anthropic_client import AnthropicClient
+
+            return AnthropicClient(llm_config)
+        except ImportError as e:
+            raise ImportError(
+                'Anthropic client requires anthropic package. '
+                'Install with: pip install graphiti-core[anthropic]'
+            ) from e
+
+    elif config.provider == LLMProvider.GEMINI:
+        try:
+            from ..llm_client.gemini_client import GeminiClient
+
+            return GeminiClient(llm_config)
+        except ImportError as e:
+            raise ImportError(
+                'Gemini client requires google-genai package. '
+                'Install with: pip install graphiti-core[google-genai]'
+            ) from e
+
+    elif config.provider == LLMProvider.GROQ:
+        try:
+            from ..llm_client.groq_client import GroqClient
+
+            return GroqClient(llm_config)
+        except ImportError as e:
+            raise ImportError(
+                'Groq client requires groq package. Install with: pip install graphiti-core[groq]'
+            ) from e
+
+    elif config.provider == LLMProvider.LITELLM:
+        try:
+            from ..llm_client.litellm_client import LiteLLMClient
+
+            # For LiteLLM, use the litellm_model if provided
+            if config.litellm_model:
+                llm_config.model = config.litellm_model
+            return LiteLLMClient(llm_config)
+        except ImportError as e:
+            raise ImportError(
+                'LiteLLM client requires litellm package. '
+                'Install with: pip install graphiti-core[litellm]'
+            ) from e
+
+    elif config.provider == LLMProvider.CUSTOM:
+        if not config.custom_client_class:
+            raise ValueError('custom_client_class is required for custom LLM provider')
+
+        # Import and instantiate custom client class
+        module_name, class_name = config.custom_client_class.rsplit('.', 1)
+        module = importlib.import_module(module_name)
+        client_class = getattr(module, class_name)
+        return client_class(llm_config)
+
+    else:
+        raise ValueError(f'Unsupported LLM provider: {config.provider}')
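+
+# Custom provider sketch: custom_client_class is a dotted path, e.g. the
+# hypothetical 'my_pkg.clients.MyLLMClient'; the class is imported at runtime
+# and is assumed to accept a single LLMConfig positional argument.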
+
+
+def create_embedder(config: 'EmbedderConfig') -> EmbedderClient:
+    """Create an embedder client based on configuration.
+
+    Args:
+        config: Embedder configuration
+
+    Returns:
+        Configured embedder client instance
+
+    Raises:
+        ValueError: If provider is not supported or configuration is invalid
+        ImportError: If required dependencies for the provider are not installed
+    """
+    if config.provider == EmbedderProvider.OPENAI:
+        from ..embedder.openai import OpenAIEmbedder, OpenAIEmbedderConfig
+
+        embedder_config = OpenAIEmbedderConfig(
+            api_key=config.api_key,
+            embedding_model=config.model or 'text-embedding-3-small',
+            embedding_dim=config.dimensions or 1536,
+        )
+        return OpenAIEmbedder(config=embedder_config)
+
+    elif config.provider == EmbedderProvider.AZURE_OPENAI:
+        from openai import AsyncAzureOpenAI
+
+        from ..embedder.azure_openai import AzureOpenAIEmbedderClient  # type: ignore
+
+        if not config.base_url:
+            raise ValueError('base_url is required for Azure OpenAI embedder')
+
+        azure_client = AsyncAzureOpenAI(
+            api_key=config.api_key,
+            azure_endpoint=config.base_url,
+            api_version=config.azure_api_version or '2024-10-21',
+        )
+
+        return AzureOpenAIEmbedderClient(  # type: ignore
+            azure_client=azure_client,
+            model=config.azure_deployment or config.model or 'text-embedding-3-small',
+        )
+
+    elif config.provider == EmbedderProvider.VOYAGE:
+        try:
+            from ..embedder.voyage import VoyageEmbedder, VoyageEmbedderConfig  # type: ignore
+
+            voyage_config = VoyageEmbedderConfig(  # type: ignore
+                api_key=config.api_key,
+                embedding_model=config.model or 'voyage-3',
+            )
+            return VoyageEmbedder(config=voyage_config)  # type: ignore
+        except ImportError as e:
+            raise ImportError(
+                'Voyage embedder requires voyageai package. '
+                'Install with: pip install graphiti-core[voyageai]'
+            ) from e
+
+    elif config.provider == EmbedderProvider.GEMINI:
+        try:
+            from ..embedder.gemini import GeminiEmbedder, GeminiEmbedderConfig  # type: ignore
+
+            gemini_config = GeminiEmbedderConfig(  # type: ignore
+                api_key=config.api_key,
+                embedding_model=config.model or 'text-embedding-004',
+            )
+            return GeminiEmbedder(config=gemini_config)  # type: ignore
+        except ImportError as e:
+            raise ImportError(
+                'Gemini embedder requires google-genai package. '
+                'Install with: pip install graphiti-core[google-genai]'
+            ) from e
+
+    elif config.provider == EmbedderProvider.CUSTOM:
+        if not config.custom_client_class:
+            raise ValueError('custom_client_class is required for custom embedder provider')
+
+        # Import and instantiate custom embedder class
+        module_name, class_name = config.custom_client_class.rsplit('.', 1)
+        module = importlib.import_module(module_name)
+        embedder_class = getattr(module, class_name)
+        return embedder_class(api_key=config.api_key, model=config.model)
+
+    else:
+        raise ValueError(f'Unsupported embedder provider: {config.provider}')
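+
+# Note (descriptive): the reranker factory below instantiates
+# OpenAIRerankerClient with its own defaults; api_key/base_url from
+# RerankerConfig are not forwarded to it yet.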
+
+
+def create_reranker(config: 'RerankerConfig') -> CrossEncoderClient:
+    """Create a reranker/cross-encoder client based on configuration.
+
+    Args:
+        config: Reranker configuration
+
+    Returns:
+        Configured reranker client instance
+
+    Raises:
+        ValueError: If provider is not supported or configuration is invalid
+    """
+    if config.provider in (RerankerProvider.OPENAI, RerankerProvider.AZURE_OPENAI):
+        return OpenAIRerankerClient()
+
+    elif config.provider == RerankerProvider.CUSTOM:
+        if not config.custom_client_class:
+            raise ValueError('custom_client_class is required for custom reranker provider')
+
+        # Import and instantiate custom reranker class
+        module_name, class_name = config.custom_client_class.rsplit('.', 1)
+        module = importlib.import_module(module_name)
+        reranker_class = getattr(module, class_name)
+        return reranker_class()
+
+    else:
+        raise ValueError(f'Unsupported reranker provider: {config.provider}')
+
+
+def create_database_driver(config: 'DatabaseConfig') -> GraphDriver:
+    """Create a graph database driver based on configuration.
+
+    Args:
+        config: Database configuration
+
+    Returns:
+        Configured database driver instance
+
+    Raises:
+        ValueError: If provider is not supported or configuration is invalid
+        ImportError: If required dependencies for the provider are not installed
+    """
+    if config.provider == DatabaseProvider.NEO4J:
+        from ..driver.neo4j_driver import Neo4jDriver
+
+        if not config.uri:
+            raise ValueError('uri is required for Neo4j database')
+
+        return Neo4jDriver(
+            uri=config.uri,
+            user=config.user,
+            password=config.password,
+            database=config.database,  # type: ignore
+        )
+
+    elif config.provider == DatabaseProvider.FALKORDB:
+        try:
+            from ..driver.falkor_driver import FalkorDriver  # type: ignore
+
+            if not config.uri:
+                raise ValueError('uri is required for FalkorDB database')
+
+            return FalkorDriver(  # type: ignore
+                uri=config.uri,
+                user=config.user,
+                password=config.password,
+                database=config.database,  # type: ignore
+            )
+        except ImportError as e:
+            raise ImportError(
+                'FalkorDB driver requires falkordb package. '
+                'Install with: pip install graphiti-core[falkordb]'
+            ) from e
+
+    elif config.provider == DatabaseProvider.NEPTUNE:
+        try:
+            from ..driver.neptune_driver import NeptuneDriver  # type: ignore
+
+            if not config.uri:
+                raise ValueError('uri is required for Neptune database')
+
+            # Neptune driver has different signature - add type ignore
+            return NeptuneDriver(config.uri)  # type: ignore
+        except ImportError as e:
+            raise ImportError(
+                'Neptune driver requires langchain-aws and related packages. 
' + 'Install with: pip install graphiti-core[neptune]' + ) from e + + elif config.provider == DatabaseProvider.CUSTOM: + if not config.custom_driver_class: + raise ValueError('custom_driver_class is required for custom database provider') + + # Import and instantiate custom driver class + module_name, class_name = config.custom_driver_class.rsplit('.', 1) + module = importlib.import_module(module_name) + driver_class = getattr(module, class_name) + return driver_class(uri=config.uri, user=config.user, password=config.password) + + else: + raise ValueError(f'Unsupported database provider: {config.provider}') diff --git a/graphiti_core/config/providers.py b/graphiti_core/config/providers.py new file mode 100644 index 000000000..f14af79c5 --- /dev/null +++ b/graphiti_core/config/providers.py @@ -0,0 +1,100 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +""" + +from enum import Enum + + +class LLMProvider(str, Enum): + """Supported LLM providers for Graphiti.""" + + OPENAI = 'openai' + AZURE_OPENAI = 'azure_openai' + ANTHROPIC = 'anthropic' + GEMINI = 'gemini' + GROQ = 'groq' + LITELLM = 'litellm' # Unified interface for multiple providers + CUSTOM = 'custom' + + +class EmbedderProvider(str, Enum): + """Supported embedding providers for Graphiti.""" + + OPENAI = 'openai' + AZURE_OPENAI = 'azure_openai' + VOYAGE = 'voyage' + GEMINI = 'gemini' + CUSTOM = 'custom' + + +class DatabaseProvider(str, Enum): + """Supported graph database providers for Graphiti.""" + + NEO4J = 'neo4j' + FALKORDB = 'falkordb' + NEPTUNE = 'neptune' + CUSTOM = 'custom' + + +class RerankerProvider(str, Enum): + """Supported reranker providers for Graphiti.""" + + OPENAI = 'openai' + AZURE_OPENAI = 'azure_openai' + CUSTOM = 'custom' + + +# Provider-specific default models +DEFAULT_MODELS = { + LLMProvider.OPENAI: { + 'model': 'gpt-4.1-mini', + 'small_model': 'gpt-4.1-nano', + }, + LLMProvider.AZURE_OPENAI: { + 'model': 'gpt-4.1-mini', + 'small_model': 'gpt-4.1-nano', + }, + LLMProvider.ANTHROPIC: { + 'model': 'claude-sonnet-4-5-latest', + 'small_model': 'claude-haiku-4-5-latest', + }, + LLMProvider.GEMINI: { + 'model': 'gemini-2.5-flash', + 'small_model': 'gemini-2.5-flash', + }, + LLMProvider.GROQ: { + 'model': 'llama-3.1-70b-versatile', + 'small_model': 'llama-3.1-8b-instant', + }, +} + +DEFAULT_EMBEDDINGS = { + EmbedderProvider.OPENAI: { + 'model': 'text-embedding-3-small', + 'dimensions': 1536, + }, + EmbedderProvider.AZURE_OPENAI: { + 'model': 'text-embedding-3-small', + 'dimensions': 1536, + }, + EmbedderProvider.VOYAGE: { + 'model': 'voyage-3', + 'dimensions': 1024, + }, + EmbedderProvider.GEMINI: { + 'model': 'text-embedding-004', + 'dimensions': 768, + }, +} diff --git a/graphiti_core/config/settings.py b/graphiti_core/config/settings.py new file mode 100644 index 000000000..9cef81304 --- /dev/null +++ b/graphiti_core/config/settings.py @@ -0,0 +1,459 @@ +""" +Copyright 2024, Zep Software, Inc. 
+ +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +""" + +import os +from pathlib import Path +from typing import Any + +import yaml +from pydantic import BaseModel, Field, model_validator + +from .providers import ( + DEFAULT_EMBEDDINGS, + DEFAULT_MODELS, + DatabaseProvider, + EmbedderProvider, + LLMProvider, + RerankerProvider, +) + + +class LLMProviderConfig(BaseModel): + """Configuration for LLM provider. + + This configuration supports multiple LLM providers including OpenAI, Azure OpenAI, + Anthropic, Gemini, Groq, and generic providers via LiteLLM. + + Examples: + >>> # OpenAI configuration + >>> config = LLMProviderConfig( + ... provider=LLMProvider.OPENAI, + ... api_key='sk-...', + ... ) + + >>> # Azure OpenAI configuration + >>> config = LLMProviderConfig( + ... provider=LLMProvider.AZURE_OPENAI, + ... api_key='...', + ... base_url='https://your-resource.openai.azure.com', + ... azure_deployment='your-deployment-name', + ... ) + + >>> # Anthropic configuration + >>> config = LLMProviderConfig( + ... provider=LLMProvider.ANTHROPIC, + ... model='claude-sonnet-4-5-latest', + ... ) + """ + + provider: LLMProvider = Field( + default=LLMProvider.OPENAI, + description='The LLM provider to use', + ) + model: str | None = Field( + default=None, + description='The model name to use. If not provided, uses provider default.', + ) + small_model: str | None = Field( + default=None, + description='Smaller/faster model for simpler tasks. If not provided, uses provider default.', + ) + api_key: str | None = Field( + default=None, + description='API key for the provider. Falls back to environment variables if not provided.', + ) + base_url: str | None = Field( + default=None, + description='Base URL for the API. 
Required for Azure OpenAI and custom endpoints.', + ) + temperature: float = Field( + default=1.0, + ge=0.0, + le=2.0, + description='Temperature for response generation', + ) + max_tokens: int = Field( + default=8192, + gt=0, + description='Maximum tokens for response generation', + ) + + # Azure-specific fields + azure_deployment: str | None = Field( + default=None, + description='Azure OpenAI deployment name (required for Azure provider)', + ) + azure_api_version: str | None = Field( + default='2024-10-21', + description='Azure OpenAI API version', + ) + + # LiteLLM-specific fields + litellm_model: str | None = Field( + default=None, + description='Full LiteLLM model string (e.g., "azure/gpt-4", "bedrock/claude-3")', + ) + + # Custom provider fields + custom_client_class: str | None = Field( + default=None, + description='Fully qualified class name for custom LLM client', + ) + + @model_validator(mode='after') + def set_defaults_and_validate(self) -> 'LLMProviderConfig': + """Set provider-specific defaults and validate configuration.""" + # Set default models if not provided + if self.model is None and self.provider in DEFAULT_MODELS: + self.model = DEFAULT_MODELS[self.provider]['model'] + + if self.small_model is None and self.provider in DEFAULT_MODELS: + self.small_model = DEFAULT_MODELS[self.provider]['small_model'] + + # Set API key from environment if not provided + if self.api_key is None: + if self.provider == LLMProvider.OPENAI: + self.api_key = os.getenv('OPENAI_API_KEY') + elif self.provider == LLMProvider.AZURE_OPENAI: + self.api_key = os.getenv('AZURE_OPENAI_API_KEY') + elif self.provider == LLMProvider.ANTHROPIC: + self.api_key = os.getenv('ANTHROPIC_API_KEY') + elif self.provider == LLMProvider.GEMINI: + self.api_key = os.getenv('GOOGLE_API_KEY') + elif self.provider == LLMProvider.GROQ: + self.api_key = os.getenv('GROQ_API_KEY') + + # Validate Azure-specific requirements + if self.provider == LLMProvider.AZURE_OPENAI: + if not self.base_url: + raise ValueError('base_url is required for Azure OpenAI provider') + if not self.azure_deployment and not self.model: + raise ValueError( + 'Either azure_deployment or model must be provided for Azure OpenAI' + ) + + # Validate LiteLLM requirements + if self.provider == LLMProvider.LITELLM and not self.litellm_model: + raise ValueError('litellm_model is required for LiteLLM provider') + + # Validate custom provider requirements + if self.provider == LLMProvider.CUSTOM and not self.custom_client_class: + raise ValueError('custom_client_class is required for custom provider') + + return self + + +class EmbedderConfig(BaseModel): + """Configuration for embedding provider. + + Examples: + >>> # OpenAI embeddings + >>> config = EmbedderConfig( + ... provider=EmbedderProvider.OPENAI, + ... ) + + >>> # Voyage AI embeddings + >>> config = EmbedderConfig( + ... provider=EmbedderProvider.VOYAGE, + ... model='voyage-3', + ... ) + """ + + provider: EmbedderProvider = Field( + default=EmbedderProvider.OPENAI, + description='The embedder provider to use', + ) + model: str | None = Field( + default=None, + description='The embedding model name. If not provided, uses provider default.', + ) + api_key: str | None = Field( + default=None, + description='API key for the provider. Falls back to environment variables if not provided.', + ) + base_url: str | None = Field( + default=None, + description='Base URL for the API. Required for Azure OpenAI.', + ) + dimensions: int | None = Field( + default=None, + description='Embedding dimensions. 
If not provided, uses provider default.', + ) + + # Azure-specific fields + azure_deployment: str | None = Field( + default=None, + description='Azure OpenAI deployment name (required for Azure provider)', + ) + azure_api_version: str | None = Field( + default='2024-10-21', + description='Azure OpenAI API version', + ) + + # Custom provider fields + custom_client_class: str | None = Field( + default=None, + description='Fully qualified class name for custom embedder client', + ) + + @model_validator(mode='after') + def set_defaults_and_validate(self) -> 'EmbedderConfig': + """Set provider-specific defaults and validate configuration.""" + # Set default model and dimensions if not provided + if self.provider in DEFAULT_EMBEDDINGS: + if self.model is None: + self.model = DEFAULT_EMBEDDINGS[self.provider]['model'] + if self.dimensions is None: + self.dimensions = DEFAULT_EMBEDDINGS[self.provider]['dimensions'] + + # Set API key from environment if not provided + if self.api_key is None: + if self.provider == EmbedderProvider.OPENAI: + self.api_key = os.getenv('OPENAI_API_KEY') + elif self.provider == EmbedderProvider.AZURE_OPENAI: + self.api_key = os.getenv('AZURE_OPENAI_API_KEY') + elif self.provider == EmbedderProvider.VOYAGE: + self.api_key = os.getenv('VOYAGE_API_KEY') + elif self.provider == EmbedderProvider.GEMINI: + self.api_key = os.getenv('GOOGLE_API_KEY') + + # Validate Azure-specific requirements + if self.provider == EmbedderProvider.AZURE_OPENAI and not self.base_url: + raise ValueError('base_url is required for Azure OpenAI embedder') + + # Validate custom provider requirements + if self.provider == EmbedderProvider.CUSTOM and not self.custom_client_class: + raise ValueError('custom_client_class is required for custom embedder') + + return self + + +class RerankerConfig(BaseModel): + """Configuration for reranker/cross-encoder provider. + + Examples: + >>> config = RerankerConfig( + ... provider=RerankerProvider.OPENAI, + ... ) + """ + + provider: RerankerProvider = Field( + default=RerankerProvider.OPENAI, + description='The reranker provider to use', + ) + api_key: str | None = Field( + default=None, + description='API key for the provider. Falls back to environment variables if not provided.', + ) + base_url: str | None = Field( + default=None, + description='Base URL for the API.', + ) + + # Azure-specific fields + azure_deployment: str | None = Field( + default=None, + description='Azure OpenAI deployment name (required for Azure provider)', + ) + + # Custom provider fields + custom_client_class: str | None = Field( + default=None, + description='Fully qualified class name for custom reranker client', + ) + + @model_validator(mode='after') + def set_defaults(self) -> 'RerankerConfig': + """Set provider-specific defaults.""" + # Set API key from environment if not provided + if self.api_key is None: + if self.provider == RerankerProvider.OPENAI: + self.api_key = os.getenv('OPENAI_API_KEY') + elif self.provider == RerankerProvider.AZURE_OPENAI: + self.api_key = os.getenv('AZURE_OPENAI_API_KEY') + + return self + + +class DatabaseConfig(BaseModel): + """Configuration for graph database. + + Examples: + >>> # Neo4j configuration + >>> config = DatabaseConfig( + ... provider=DatabaseProvider.NEO4J, + ... uri='bolt://localhost:7687', + ... user='neo4j', + ... password='password', + ... ) + + >>> # FalkorDB configuration + >>> config = DatabaseConfig( + ... provider=DatabaseProvider.FALKORDB, + ... uri='redis://localhost:6379', + ... 
) + """ + + provider: DatabaseProvider = Field( + default=DatabaseProvider.NEO4J, + description='The graph database provider to use', + ) + uri: str | None = Field( + default=None, + description='Database connection URI', + ) + user: str | None = Field( + default=None, + description='Database username', + ) + password: str | None = Field( + default=None, + description='Database password', + ) + database: str | None = Field( + default=None, + description='Database name. Uses provider default if not specified.', + ) + + # Custom provider fields + custom_driver_class: str | None = Field( + default=None, + description='Fully qualified class name for custom database driver', + ) + + @model_validator(mode='after') + def validate_database_config(self) -> 'DatabaseConfig': + """Validate database configuration.""" + if self.provider == DatabaseProvider.CUSTOM and not self.custom_driver_class: + raise ValueError('custom_driver_class is required for custom database provider') + return self + + +class GraphitiConfig(BaseModel): + """Main Graphiti configuration. + + This is the primary configuration class that aggregates all provider configurations. + It supports loading from YAML files, environment variables, and programmatic configuration. + + Examples: + >>> # Programmatic configuration + >>> config = GraphitiConfig( + ... llm=LLMProviderConfig(provider=LLMProvider.ANTHROPIC), + ... embedder=EmbedderConfig(provider=EmbedderProvider.VOYAGE), + ... database=DatabaseConfig( + ... uri='bolt://localhost:7687', + ... user='neo4j', + ... password='password', + ... ), + ... ) + + >>> # Load from YAML file + >>> config = GraphitiConfig.from_yaml('graphiti.yaml') + + >>> # Load from environment (looks for GRAPHITI_CONFIG_PATH) + >>> config = GraphitiConfig.from_env() + """ + + llm: LLMProviderConfig = Field( + default_factory=LLMProviderConfig, + description='LLM provider configuration', + ) + embedder: EmbedderConfig = Field( + default_factory=EmbedderConfig, + description='Embedder provider configuration', + ) + reranker: RerankerConfig = Field( + default_factory=RerankerConfig, + description='Reranker provider configuration', + ) + database: DatabaseConfig = Field( + default_factory=DatabaseConfig, + description='Database provider configuration', + ) + + # General settings + store_raw_episode_content: bool = Field( + default=True, + description='Whether to store raw episode content in the database', + ) + max_coroutines: int | None = Field( + default=None, + description='Maximum number of concurrent operations', + ) + + @classmethod + def from_yaml(cls, path: str | Path) -> 'GraphitiConfig': + """Load configuration from a YAML file. + + Args: + path: Path to the YAML configuration file + + Returns: + GraphitiConfig instance loaded from the file + + Raises: + FileNotFoundError: If the configuration file doesn't exist + ValueError: If the YAML file is invalid + """ + path = Path(path) + if not path.exists(): + raise FileNotFoundError(f'Configuration file not found: {path}') + + with open(path) as f: + config_dict = yaml.safe_load(f) + + if config_dict is None: + config_dict = {} + + return cls(**config_dict) + + @classmethod + def from_env(cls, env_var: str = 'GRAPHITI_CONFIG_PATH') -> 'GraphitiConfig': + """Load configuration from a YAML file specified in an environment variable. 
+ + Args: + env_var: Name of the environment variable containing the config file path + + Returns: + GraphitiConfig instance loaded from the file, or default config if env var not set + + Raises: + FileNotFoundError: If the specified config file doesn't exist + """ + config_path = os.getenv(env_var) + if config_path: + return cls.from_yaml(config_path) + + # Look for default config files in current directory + for default_file in ['.graphiti.yaml', '.graphiti.yml', 'graphiti.yaml', 'graphiti.yml']: + if Path(default_file).exists(): + return cls.from_yaml(default_file) + + # Return default configuration + return cls() + + def to_yaml(self, path: str | Path) -> None: + """Save configuration to a YAML file. + + Args: + path: Path where the configuration file should be saved + """ + path = Path(path) + # Use json mode to convert enums to their values + config_dict = self.model_dump(exclude_none=True, mode='json') + + with open(path, 'w') as f: + yaml.dump(config_dict, f, default_flow_style=False, sort_keys=False) diff --git a/graphiti_core/graphiti.py b/graphiti_core/graphiti.py index c4fa60c51..0c3c5e81a 100644 --- a/graphiti_core/graphiti.py +++ b/graphiti_core/graphiti.py @@ -17,11 +17,15 @@ import logging from datetime import datetime from time import time +from typing import TYPE_CHECKING from dotenv import load_dotenv from pydantic import BaseModel from typing_extensions import LiteralString +if TYPE_CHECKING: + from graphiti_core.config import GraphitiConfig + from graphiti_core.cross_encoder.client import CrossEncoderClient from graphiti_core.cross_encoder.openai_reranker_client import OpenAIRerankerClient from graphiti_core.decorators import handle_multiple_group_ids @@ -139,6 +143,7 @@ def __init__( max_coroutines: int | None = None, tracer: Tracer | None = None, trace_span_prefix: str = 'graphiti', + config: 'GraphitiConfig | None' = None, ): """ Initialize a Graphiti instance. @@ -175,6 +180,9 @@ def __init__( An OpenTelemetry tracer instance for distributed tracing. If not provided, tracing is disabled (no-op). trace_span_prefix : str, optional Prefix to prepend to all span names. Defaults to 'graphiti'. + config : GraphitiConfig | None, optional + A GraphitiConfig instance for unified configuration. If provided, it takes precedence + over individual parameters. Allows configuration via YAML files or programmatically. Returns ------- @@ -186,36 +194,91 @@ def __init__( credentials. It also sets up the LLM client, either using the provided client or by creating a default OpenAIClient. - The default database name is defined during the driver’s construction. If a different database name + The default database name is defined during the driver's construction. If a different database name is required, it should be specified in the URI or set separately after initialization. The OpenAI API key is expected to be set in the environment variables. Make sure to set the OPENAI_API_KEY environment variable before initializing Graphiti if you're using the default OpenAIClient. 
+ + Examples: + >>> # Traditional initialization + >>> graphiti = Graphiti(uri='bolt://localhost:7687', user='neo4j', password='password') + + >>> # New config-based initialization + >>> from graphiti_core.config import GraphitiConfig, LLMProviderConfig, LLMProvider + >>> config = GraphitiConfig.from_yaml('graphiti.yaml') + >>> graphiti = Graphiti(config=config) + + >>> # Or use the factory method + >>> graphiti = Graphiti.from_config(config) """ - if graph_driver: - self.driver = graph_driver - else: - if uri is None: - raise ValueError('uri must be provided when graph_driver is None') - self.driver = Neo4jDriver(uri, user, password) - - self.store_raw_episode_content = store_raw_episode_content - self.max_coroutines = max_coroutines - if llm_client: - self.llm_client = llm_client - else: - self.llm_client = OpenAIClient() - if embedder: - self.embedder = embedder - else: - self.embedder = OpenAIEmbedder() - if cross_encoder: - self.cross_encoder = cross_encoder + # If config is provided, use it to initialize clients + if config is not None: + from graphiti_core.config.factory import ( + create_database_driver, + create_embedder, + create_llm_client, + create_reranker, + ) + + # Use config values, allowing individual params to override + if graph_driver is None: + self.driver = create_database_driver(config.database) + else: + self.driver = graph_driver + + if llm_client is None: + self.llm_client = create_llm_client(config.llm) + else: + self.llm_client = llm_client + + if embedder is None: + self.embedder = create_embedder(config.embedder) + else: + self.embedder = embedder + + if cross_encoder is None: + self.cross_encoder = create_reranker(config.reranker) + else: + self.cross_encoder = cross_encoder + + self.store_raw_episode_content = ( + store_raw_episode_content + if store_raw_episode_content is not None + else config.store_raw_episode_content + ) + self.max_coroutines = ( + max_coroutines if max_coroutines is not None else config.max_coroutines + ) + else: - self.cross_encoder = OpenAIRerankerClient() + # Traditional initialization path (backward compatible) + if graph_driver: + self.driver = graph_driver + else: + if uri is None: + raise ValueError( + 'uri must be provided when graph_driver is None and config is None' + ) + self.driver = Neo4jDriver(uri, user, password) + + self.store_raw_episode_content = store_raw_episode_content + self.max_coroutines = max_coroutines + if llm_client: + self.llm_client = llm_client + else: + self.llm_client = OpenAIClient() + if embedder: + self.embedder = embedder + else: + self.embedder = OpenAIEmbedder() + if cross_encoder: + self.cross_encoder = cross_encoder + else: + self.cross_encoder = OpenAIRerankerClient() # Initialize tracer self.tracer = create_tracer(tracer, trace_span_prefix) @@ -234,6 +297,44 @@ def __init__( # Capture telemetry event self._capture_initialization_telemetry() + @classmethod + def from_config( + cls, + config: 'GraphitiConfig', + tracer: Tracer | None = None, + trace_span_prefix: str = 'graphiti', + ) -> 'Graphiti': + """Create a Graphiti instance from a GraphitiConfig. + + This is a convenience method for creating Graphiti instances using the + new configuration system. 
+ + Parameters + ---------- + config : GraphitiConfig + The configuration object containing all settings + tracer : Tracer | None, optional + An OpenTelemetry tracer instance for distributed tracing + trace_span_prefix : str, optional + Prefix to prepend to all span names + + Returns + ------- + Graphiti + A new Graphiti instance configured according to the provided config + + Examples + -------- + >>> from graphiti_core.config import GraphitiConfig + >>> config = GraphitiConfig.from_yaml('graphiti.yaml') + >>> graphiti = Graphiti.from_config(config) + + >>> # Or with environment-based config + >>> config = GraphitiConfig.from_env() + >>> graphiti = Graphiti.from_config(config) + """ + return cls(config=config, tracer=tracer, trace_span_prefix=trace_span_prefix) + def _capture_initialization_telemetry(self): """Capture telemetry event for Graphiti initialization.""" try: diff --git a/graphiti_core/llm_client/litellm_client.py b/graphiti_core/llm_client/litellm_client.py new file mode 100644 index 000000000..4d5ad7ea6 --- /dev/null +++ b/graphiti_core/llm_client/litellm_client.py @@ -0,0 +1,267 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +""" + +import logging +import typing + +from pydantic import BaseModel + +from ..prompts.models import Message +from .client import LLMClient +from .config import DEFAULT_MAX_TOKENS, LLMConfig, ModelSize +from .errors import RateLimitError + +logger = logging.getLogger(__name__) + +try: + import litellm # type: ignore + from litellm import acompletion # type: ignore + + LITELLM_AVAILABLE = True +except ImportError: + LITELLM_AVAILABLE = False + logger.warning('LiteLLM not available. Install with: pip install graphiti-core[litellm]') + + +class LiteLLMClient(LLMClient): + """LLM client using LiteLLM for unified multi-provider support. + + LiteLLM provides a unified interface to 100+ LLM providers including: + - OpenAI, Azure OpenAI + - Anthropic + - Google (Gemini, Vertex AI) + - AWS Bedrock + - Cohere, Replicate, HuggingFace + - Local models (Ollama, vLLM, LocalAI) + - And many more + + Examples: + >>> # OpenAI via LiteLLM + >>> client = LiteLLMClient( + ... LLMConfig( + ... model='gpt-4.1-mini', + ... api_key='sk-...', + ... ) + ... ) + + >>> # Azure OpenAI + >>> client = LiteLLMClient( + ... LLMConfig( + ... model='azure/gpt-4-deployment-name', + ... base_url='https://your-resource.openai.azure.com', + ... api_key='...', + ... ) + ... ) + + >>> # AWS Bedrock + >>> client = LiteLLMClient( + ... LLMConfig( + ... model='bedrock/anthropic.claude-3-sonnet-20240229-v1:0', + ... ) + ... ) + + >>> # Ollama (local) + >>> client = LiteLLMClient( + ... LLMConfig( + ... model='ollama/llama2', + ... base_url='http://localhost:11434', + ... ) + ... ) + """ + + def __init__(self, config: LLMConfig | None = None, cache: bool = False): + """Initialize LiteLLM client. + + Args: + config: LLM configuration. Model name should follow LiteLLM conventions. + cache: Whether to enable response caching. 
+ + Raises: + ImportError: If LiteLLM is not installed. + """ + if not LITELLM_AVAILABLE: + raise ImportError( + 'LiteLLM is required for LiteLLMClient. ' + 'Install with: pip install graphiti-core[litellm]' + ) + + super().__init__(config, cache) + + # Configure LiteLLM + if self.config.base_url: + litellm.api_base = self.config.base_url + + if self.config.api_key: + litellm.api_key = self.config.api_key + + # Disable verbose logging by default + litellm.suppress_debug_info = True + + logger.info(f'Initialized LiteLLM client with model: {self.model}') + + async def _generate_response( + self, + messages: list[Message], + response_model: type[BaseModel] | None = None, + max_tokens: int = DEFAULT_MAX_TOKENS, + model_size: ModelSize = ModelSize.medium, + ) -> dict[str, typing.Any]: + """Generate a response using LiteLLM. + + Args: + messages: List of conversation messages + response_model: Optional Pydantic model for structured output + max_tokens: Maximum tokens in response + model_size: Size of model to use (medium or small) + + Returns: + Dictionary containing the response data + + Raises: + RateLimitError: If rate limit is exceeded + Exception: For other errors from the LLM provider + """ + # Select model based on size + model = self.model if model_size == ModelSize.medium else self.small_model + + if not model: + raise ValueError('Model must be specified for LiteLLM client') + + # Convert messages to LiteLLM format + litellm_messages = [ + {'role': msg.role, 'content': self._clean_input(msg.content)} for msg in messages + ] + + try: + # Check if provider supports structured output + supports_structured = self._supports_structured_output(model) + + if response_model and supports_structured: + # Use LiteLLM's structured output support + with self.tracer.start_span('litellm_completion') as span: + span.add_attributes( + { + 'model': model, + 'structured_output': True, + 'max_tokens': max_tokens, + } + ) + + response = await acompletion( + model=model, + messages=litellm_messages, + temperature=self.temperature, + max_tokens=max_tokens, + response_format={'type': 'json_object'}, + ) + + # Parse JSON response into Pydantic model + content = response.choices[0].message.content + import json + + result = json.loads(content) + + # Validate with response model + if response_model: + validated = response_model(**result) + return validated.model_dump() + + return result + + elif response_model: + # Fallback: Use OpenAI-style function calling or prompt engineering + with self.tracer.start_span('litellm_completion_json') as span: + span.add_attributes( + { + 'model': model, + 'structured_output': False, + 'max_tokens': max_tokens, + } + ) + + # Add JSON schema to the last message + schema_str = response_model.model_json_schema() + litellm_messages[-1]['content'] += ( + f'\n\nRespond with valid JSON matching this schema: {schema_str}' + ) + + response = await acompletion( + model=model, + messages=litellm_messages, + temperature=self.temperature, + max_tokens=max_tokens, + ) + + content = response.choices[0].message.content + import json + + # Try to parse JSON from response + result = json.loads(content) + validated = response_model(**result) + return validated.model_dump() + + else: + # Regular completion without structured output + with self.tracer.start_span('litellm_completion_text') as span: + span.add_attributes( + { + 'model': model, + 'max_tokens': max_tokens, + } + ) + + response = await acompletion( + model=model, + messages=litellm_messages, + temperature=self.temperature, + 
max_tokens=max_tokens, + ) + + return {'content': response.choices[0].message.content} + + except Exception as e: + error_str = str(e).lower() + + # Check for rate limiting + if 'rate limit' in error_str or 'quota' in error_str or '429' in error_str: + raise RateLimitError(f'Rate limit exceeded for model {model}: {e}') from e + + # Re-raise other exceptions + logger.error(f'Error generating response with LiteLLM: {e}') + raise + + def _supports_structured_output(self, model: str) -> bool: + """Check if a model supports structured JSON output. + + Args: + model: Model identifier (e.g., "gpt-4", "azure/gpt-4", "bedrock/claude-3") + + Returns: + True if the model supports structured output, False otherwise + """ + # Extract base model name from LiteLLM format + model_lower = model.lower() + + # OpenAI models with structured output support + if any(x in model_lower for x in ['gpt-4', 'gpt-3.5', 'gpt-4.1', 'gpt-5', 'o1', 'o3']): + return True + + # Gemini models support JSON mode + if 'gemini' in model_lower: + return True + + # Claude 3+ models support JSON mode + return 'claude-3' in model_lower or 'claude-4' in model_lower diff --git a/pyproject.toml b/pyproject.toml index 7927dc72e..b2e5f05c8 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -18,7 +18,8 @@ dependencies = [ "tenacity>=9.0.0", "numpy>=1.0.0", "python-dotenv>=1.0.1", - "posthog>=3.0.0" + "posthog>=3.0.0", + "pyyaml>=6.0.0" ] [project.urls] @@ -36,6 +37,7 @@ neo4j-opensearch = ["boto3>=1.39.16", "opensearch-py>=3.0.0"] sentence-transformers = ["sentence-transformers>=3.2.1"] neptune = ["langchain-aws>=0.2.29", "opensearch-py>=3.0.0", "boto3>=1.39.16"] tracing = ["opentelemetry-api>=1.20.0", "opentelemetry-sdk>=1.20.0"] +litellm = ["litellm>=1.52.0"] dev = [ "pyright>=1.1.404", "groq>=0.2.0", diff --git a/tests/config/test_factory.py b/tests/config/test_factory.py new file mode 100644 index 000000000..47e7859c6 --- /dev/null +++ b/tests/config/test_factory.py @@ -0,0 +1,189 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+""" + +import pytest + +from graphiti_core.config import ( + DatabaseConfig, + EmbedderConfig, + EmbedderProvider, + LLMProvider, + LLMProviderConfig, + RerankerConfig, +) +from graphiti_core.config.factory import ( + create_database_driver, + create_embedder, + create_llm_client, + create_reranker, +) +from graphiti_core.config.providers import DatabaseProvider, RerankerProvider +from graphiti_core.cross_encoder.openai_reranker_client import OpenAIRerankerClient +from graphiti_core.embedder.openai import OpenAIEmbedder +from graphiti_core.llm_client.openai_client import OpenAIClient + + +class TestCreateLLMClient: + def test_create_openai_client(self, monkeypatch): + """Test creating OpenAI LLM client.""" + monkeypatch.setenv('OPENAI_API_KEY', 'test-key') + + config = LLMProviderConfig(provider=LLMProvider.OPENAI) + client = create_llm_client(config) + + assert isinstance(client, OpenAIClient) + assert client.model == 'gpt-4.1-mini' + assert client.small_model == 'gpt-4.1-nano' + + def test_create_azure_openai_client(self, monkeypatch): + """Test creating Azure OpenAI LLM client.""" + from graphiti_core.llm_client.azure_openai_client import AzureOpenAILLMClient + + monkeypatch.setenv('AZURE_OPENAI_API_KEY', 'test-key') + + config = LLMProviderConfig( + provider=LLMProvider.AZURE_OPENAI, + base_url='https://my-resource.openai.azure.com', + azure_deployment='gpt-4-deployment', + ) + client = create_llm_client(config) + + assert isinstance(client, AzureOpenAILLMClient) + + def test_create_anthropic_client_missing_dep(self): + """Test creating Anthropic client without dependency raises error.""" + config = LLMProviderConfig(provider=LLMProvider.ANTHROPIC) + + # This test will pass if anthropic is installed (in dev env) + # or raise ImportError if not installed + try: + client = create_llm_client(config) + from graphiti_core.llm_client.anthropic_client import AnthropicClient + + assert isinstance(client, AnthropicClient) + except ImportError as e: + assert 'anthropic' in str(e).lower() + + def test_create_litellm_client_missing_dep(self): + """Test creating LiteLLM client without dependency raises error.""" + config = LLMProviderConfig( + provider=LLMProvider.LITELLM, + litellm_model='gpt-4', + ) + + # This will raise ImportError if litellm is not installed + try: + client = create_llm_client(config) + from graphiti_core.llm_client.litellm_client import LiteLLMClient + + assert isinstance(client, LiteLLMClient) + except ImportError as e: + assert 'litellm' in str(e).lower() + + def test_unsupported_provider_raises_error(self): + """Test unsupported provider raises ValueError.""" + # We need to bypass pydantic validation to test this + config = LLMProviderConfig(provider=LLMProvider.OPENAI) + config.provider = 'unsupported' # type: ignore + + with pytest.raises(ValueError, match='Unsupported LLM provider'): + create_llm_client(config) + + +class TestCreateEmbedder: + def test_create_openai_embedder(self, monkeypatch): + """Test creating OpenAI embedder.""" + monkeypatch.setenv('OPENAI_API_KEY', 'test-key') + + config = EmbedderConfig(provider=EmbedderProvider.OPENAI) + embedder = create_embedder(config) + + assert isinstance(embedder, OpenAIEmbedder) + assert embedder.config.embedding_model == 'text-embedding-3-small' + + def test_create_voyage_embedder_missing_dep(self): + """Test creating Voyage embedder without dependency.""" + config = EmbedderConfig(provider=EmbedderProvider.VOYAGE) + + try: + embedder = create_embedder(config) + from graphiti_core.embedder.voyage import VoyageEmbedder + 
+ assert isinstance(embedder, VoyageEmbedder) + except ImportError as e: + assert 'voyageai' in str(e).lower() + + def test_create_azure_openai_embedder(self, monkeypatch): + """Test creating Azure OpenAI embedder.""" + from graphiti_core.embedder.azure_openai import AzureOpenAIEmbedderClient + + monkeypatch.setenv('AZURE_OPENAI_API_KEY', 'test-key') + + config = EmbedderConfig( + provider=EmbedderProvider.AZURE_OPENAI, + base_url='https://my-resource.openai.azure.com', + azure_deployment='embedding-deployment', + ) + embedder = create_embedder(config) + + assert isinstance(embedder, AzureOpenAIEmbedderClient) + + +class TestCreateReranker: + def test_create_openai_reranker(self): + """Test creating OpenAI reranker.""" + config = RerankerConfig(provider=RerankerProvider.OPENAI) + reranker = create_reranker(config) + + assert isinstance(reranker, OpenAIRerankerClient) + + +class TestCreateDatabaseDriver: + def test_create_neo4j_driver(self): + """Test creating Neo4j driver.""" + from graphiti_core.driver.neo4j_driver import Neo4jDriver + + config = DatabaseConfig( + provider=DatabaseProvider.NEO4J, + uri='bolt://localhost:7687', + user='neo4j', + password='password', + ) + driver = create_database_driver(config) + + assert isinstance(driver, Neo4jDriver) + + def test_neo4j_driver_missing_uri(self): + """Test Neo4j driver without URI raises error.""" + config = DatabaseConfig(provider=DatabaseProvider.NEO4J) + + with pytest.raises(ValueError, match='uri is required'): + create_database_driver(config) + + def test_create_falkordb_driver_missing_dep(self): + """Test creating FalkorDB driver without dependency.""" + config = DatabaseConfig( + provider=DatabaseProvider.FALKORDB, + uri='redis://localhost:6379', + ) + + try: + driver = create_database_driver(config) + from graphiti_core.driver.falkor_driver import FalkorDriver + + assert isinstance(driver, FalkorDriver) + except ImportError as e: + assert 'falkordb' in str(e).lower() diff --git a/tests/config/test_settings.py b/tests/config/test_settings.py new file mode 100644 index 000000000..7a7bc8b99 --- /dev/null +++ b/tests/config/test_settings.py @@ -0,0 +1,261 @@ +""" +Copyright 2024, Zep Software, Inc. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+""" + +import os +from pathlib import Path +from tempfile import TemporaryDirectory + +import pytest + +from graphiti_core.config import ( + DatabaseConfig, + EmbedderConfig, + EmbedderProvider, + GraphitiConfig, + LLMProvider, + LLMProviderConfig, + RerankerConfig, +) +from graphiti_core.config.providers import DatabaseProvider, RerankerProvider + + +class TestLLMProviderConfig: + def test_openai_defaults(self): + """Test OpenAI provider defaults are set correctly.""" + config = LLMProviderConfig(provider=LLMProvider.OPENAI) + + assert config.provider == LLMProvider.OPENAI + assert config.model == 'gpt-4.1-mini' + assert config.small_model == 'gpt-4.1-nano' + assert config.temperature == 1.0 + assert config.max_tokens == 8192 + + def test_anthropic_defaults(self): + """Test Anthropic provider defaults are set correctly.""" + config = LLMProviderConfig(provider=LLMProvider.ANTHROPIC) + + assert config.provider == LLMProvider.ANTHROPIC + assert config.model == 'claude-sonnet-4-5-latest' + assert config.small_model == 'claude-haiku-4-5-latest' + + def test_azure_openai_requires_base_url(self): + """Test Azure OpenAI provider requires base_url.""" + with pytest.raises(ValueError, match='base_url is required'): + LLMProviderConfig(provider=LLMProvider.AZURE_OPENAI) + + def test_azure_openai_valid_config(self): + """Test valid Azure OpenAI configuration.""" + config = LLMProviderConfig( + provider=LLMProvider.AZURE_OPENAI, + base_url='https://my-resource.openai.azure.com', + azure_deployment='gpt-4-deployment', + api_key='test-key', + ) + + assert config.provider == LLMProvider.AZURE_OPENAI + assert config.base_url == 'https://my-resource.openai.azure.com' + assert config.azure_deployment == 'gpt-4-deployment' + + def test_litellm_requires_model(self): + """Test LiteLLM provider requires litellm_model.""" + with pytest.raises(ValueError, match='litellm_model is required'): + LLMProviderConfig(provider=LLMProvider.LITELLM) + + def test_litellm_valid_config(self): + """Test valid LiteLLM configuration.""" + config = LLMProviderConfig( + provider=LLMProvider.LITELLM, + litellm_model='azure/gpt-4', + ) + + assert config.provider == LLMProvider.LITELLM + assert config.litellm_model == 'azure/gpt-4' + + def test_custom_provider_requires_client_class(self): + """Test custom provider requires custom_client_class.""" + with pytest.raises(ValueError, match='custom_client_class is required'): + LLMProviderConfig(provider=LLMProvider.CUSTOM) + + def test_api_key_from_env(self, monkeypatch): + """Test API key is loaded from environment.""" + monkeypatch.setenv('OPENAI_API_KEY', 'test-api-key') + + config = LLMProviderConfig(provider=LLMProvider.OPENAI) + + assert config.api_key == 'test-api-key' + + +class TestEmbedderConfig: + def test_openai_defaults(self): + """Test OpenAI embedder defaults.""" + config = EmbedderConfig(provider=EmbedderProvider.OPENAI) + + assert config.provider == EmbedderProvider.OPENAI + assert config.model == 'text-embedding-3-small' + assert config.dimensions == 1536 + + def test_voyage_defaults(self): + """Test Voyage AI embedder defaults.""" + config = EmbedderConfig(provider=EmbedderProvider.VOYAGE) + + assert config.provider == EmbedderProvider.VOYAGE + assert config.model == 'voyage-3' + assert config.dimensions == 1024 + + def test_azure_requires_base_url(self): + """Test Azure embedder requires base_url.""" + with pytest.raises(ValueError, match='base_url is required'): + EmbedderConfig(provider=EmbedderProvider.AZURE_OPENAI) + + def 
test_custom_embedder_requires_class(self):
+        """Test custom embedder requires custom_client_class."""
+        with pytest.raises(ValueError, match='custom_client_class is required'):
+            EmbedderConfig(provider=EmbedderProvider.CUSTOM)
+
+
+class TestGraphitiConfig:
+    def test_default_config(self):
+        """Test default configuration."""
+        config = GraphitiConfig()
+
+        assert config.llm.provider == LLMProvider.OPENAI
+        assert config.embedder.provider == EmbedderProvider.OPENAI
+        assert config.database.provider == DatabaseProvider.NEO4J
+        assert config.store_raw_episode_content is True
+
+    def test_yaml_round_trip(self):
+        """Test saving and loading configuration from YAML."""
+        with TemporaryDirectory() as tmpdir:
+            config_path = Path(tmpdir) / 'test_config.yaml'
+
+            # Create and save config
+            original_config = GraphitiConfig(
+                llm=LLMProviderConfig(
+                    provider=LLMProvider.ANTHROPIC,
+                    model='claude-sonnet-4-5-latest',
+                    temperature=0.7,
+                ),
+                embedder=EmbedderConfig(
+                    provider=EmbedderProvider.VOYAGE,
+                    model='voyage-3',
+                ),
+                store_raw_episode_content=False,
+            )
+
+            original_config.to_yaml(config_path)
+
+            # Load config back
+            loaded_config = GraphitiConfig.from_yaml(config_path)
+
+            assert loaded_config.llm.provider == LLMProvider.ANTHROPIC
+            assert loaded_config.llm.model == 'claude-sonnet-4-5-latest'
+            assert loaded_config.llm.temperature == 0.7
+            assert loaded_config.embedder.provider == EmbedderProvider.VOYAGE
+            assert loaded_config.embedder.model == 'voyage-3'
+            assert loaded_config.store_raw_episode_content is False
+
+    def test_from_yaml_file_not_found(self):
+        """Test loading from non-existent file raises error."""
+        with pytest.raises(FileNotFoundError):
+            GraphitiConfig.from_yaml('nonexistent.yaml')
+
+    def test_from_env_with_config_path(self, monkeypatch):
+        """Test loading config from environment variable."""
+        with TemporaryDirectory() as tmpdir:
+            config_path = Path(tmpdir) / 'graphiti.yaml'
+
+            # Create config file
+            config = GraphitiConfig(
+                llm=LLMProviderConfig(provider=LLMProvider.GEMINI),
+            )
+            config.to_yaml(config_path)
+
+            # Set environment variable
+            monkeypatch.setenv('GRAPHITI_CONFIG_PATH', str(config_path))
+
+            # Load from environment
+            loaded_config = GraphitiConfig.from_env()
+
+            assert loaded_config.llm.provider == LLMProvider.GEMINI
+
+    def test_from_env_default_files(self):
+        """Test loading from default config files."""
+        with TemporaryDirectory() as tmpdir:
+            config_path = Path(tmpdir) / '.graphiti.yaml'
+
+            # Create config in temp dir
+            config = GraphitiConfig(
+                llm=LLMProviderConfig(provider=LLMProvider.GROQ),
+            )
+            config.to_yaml(config_path)
+
+            # Change to temp dir and load
+            original_dir = os.getcwd()
+            try:
+                os.chdir(tmpdir)
+                loaded_config = GraphitiConfig.from_env()
+                assert loaded_config.llm.provider == LLMProvider.GROQ
+            finally:
+                os.chdir(original_dir)
+
+    def test_from_env_no_config_returns_defaults(self, monkeypatch):
+        """Test loading from environment without config returns defaults."""
+        # Make sure env var is not set
+        monkeypatch.delenv('GRAPHITI_CONFIG_PATH', raising=False)
+
+        config = GraphitiConfig.from_env()
+
+        # Should return default config
+        assert config.llm.provider == LLMProvider.OPENAI
+        assert config.embedder.provider == EmbedderProvider.OPENAI
+
+
+class TestDatabaseConfig:
+    def test_neo4j_config(self):
+        """Test Neo4j database configuration."""
+        config = DatabaseConfig(
+            provider=DatabaseProvider.NEO4J,
+            uri='bolt://localhost:7687',
+            user='neo4j',
+            password='password',
+            database='graphiti',
+        )
+
+        assert config.provider == DatabaseProvider.NEO4J
+        assert config.uri == 'bolt://localhost:7687'
+        assert config.user == 'neo4j'
+        assert config.database == 'graphiti'
+
+    def test_custom_database_requires_driver_class(self):
+        """Test custom database provider requires custom_driver_class."""
+        with pytest.raises(ValueError, match='custom_driver_class is required'):
+            DatabaseConfig(provider=DatabaseProvider.CUSTOM)
+
+
+class TestRerankerConfig:
+    def test_default_config(self):
+        """Test default reranker configuration."""
+        config = RerankerConfig()
+
+        assert config.provider == RerankerProvider.OPENAI
+
+    def test_api_key_from_env(self, monkeypatch):
+        """Test reranker API key from environment."""
+        monkeypatch.setenv('OPENAI_API_KEY', 'test-key')
+
+        config = RerankerConfig(provider=RerankerProvider.OPENAI)
+
+        assert config.api_key == 'test-key'
diff --git a/uv.lock b/uv.lock
index 546537e17..7ef780f73 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1,5 +1,5 @@
 version = 1
-revision = 2
+revision = 3
 requires-python = ">=3.10, <4"
 resolution-markers = [
     "python_full_version >= '3.14'",
 ]
@@ -499,6 +499,18 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/20/94/c5790835a017658cbfabd07f3bfb549140c3ac458cfc196323996b10095a/charset_normalizer-3.4.2-py3-none-any.whl", hash = "sha256:7f56930ab0abd1c45cd15be65cc741c28b1c9a34876ce8c17a2fa107810c0af0", size = 52626, upload-time = "2025-05-02T08:34:40.053Z" },
 ]
 
+[[package]]
+name = "click"
+version = "8.3.1"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/3d/fa/656b739db8587d7b5dfa22e22ed02566950fbfbcdc20311993483657a5c0/click-8.3.1.tar.gz", hash = "sha256:12ff4785d337a1bb490bb7e9c2b1ee5da3112e94a8622f26a6c77f5d2fc6842a", size = 295065, upload-time = "2025-11-15T20:45:42.706Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/98/78/01c019cdb5d6498122777c1a43056ebb3ebfeef2076d9d026bfe15583b2b/click-8.3.1-py3-none-any.whl", hash = "sha256:981153a64e25f12d547d3426c367a4857371575ee7ad18df2a6183ab0545b2a6", size = 108274, upload-time = "2025-11-15T20:45:41.139Z" },
+]
+
 [[package]]
 name = "colorama"
 version = "0.4.6"
@@ -653,6 +665,69 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/90/2b/0817a2b257fe88725c25589d89aec060581aabf668707a8d03b2e9e0cb2a/fastjsonschema-2.21.1-py3-none-any.whl", hash = "sha256:c9e5b7e908310918cf494a434eeb31384dd84a98b57a30bcb1f535015b554667", size = 23924, upload-time = "2024-12-02T10:55:07.599Z" },
 ]
 
+[[package]]
+name = "fastuuid"
+version = "0.14.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/c3/7d/d9daedf0f2ebcacd20d599928f8913e9d2aea1d56d2d355a93bfa2b611d7/fastuuid-0.14.0.tar.gz", hash = "sha256:178947fc2f995b38497a74172adee64fdeb8b7ec18f2a5934d037641ba265d26", size = 18232, upload-time = "2025-10-19T22:19:22.402Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ad/b2/731a6696e37cd20eed353f69a09f37a984a43c9713764ee3f7ad5f57f7f9/fastuuid-0.14.0-cp310-cp310-macosx_10_12_x86_64.macosx_11_0_arm64.macosx_10_12_universal2.whl", hash = "sha256:6e6243d40f6c793c3e2ee14c13769e341b90be5ef0c23c82fa6515a96145181a", size = 516760, upload-time = "2025-10-19T22:25:21.509Z" },
+    { url = "https://files.pythonhosted.org/packages/c5/79/c73c47be2a3b8734d16e628982653517f80bbe0570e27185d91af6096507/fastuuid-0.14.0-cp310-cp310-macosx_10_12_x86_64.whl", hash = "sha256:13ec4f2c3b04271f62be2e1ce7e95ad2dd1cf97e94503a3760db739afbd48f00", size = 264748, upload-time = "2025-10-19T22:41:52.873Z" },
+    { url = "https://files.pythonhosted.org/packages/24/c5/84c1eea05977c8ba5173555b0133e3558dc628bcf868d6bf1689ff14aedc/fastuuid-0.14.0-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:b2fdd48b5e4236df145a149d7125badb28e0a383372add3fbaac9a6b7a394470", size = 254537, upload-time = "2025-10-19T22:33:55.603Z" },
+    { url = "https://files.pythonhosted.org/packages/0e/23/4e362367b7fa17dbed646922f216b9921efb486e7abe02147e4b917359f8/fastuuid-0.14.0-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f74631b8322d2780ebcf2d2d75d58045c3e9378625ec51865fe0b5620800c39d", size = 278994, upload-time = "2025-10-19T22:26:17.631Z" },
+    { url = "https://files.pythonhosted.org/packages/b2/72/3985be633b5a428e9eaec4287ed4b873b7c4c53a9639a8b416637223c4cd/fastuuid-0.14.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:83cffc144dc93eb604b87b179837f2ce2af44871a7b323f2bfed40e8acb40ba8", size = 280003, upload-time = "2025-10-19T22:23:45.415Z" },
+    { url = "https://files.pythonhosted.org/packages/b3/6d/6ef192a6df34e2266d5c9deb39cd3eea986df650cbcfeaf171aa52a059c3/fastuuid-0.14.0-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1a771f135ab4523eb786e95493803942a5d1fc1610915f131b363f55af53b219", size = 303583, upload-time = "2025-10-19T22:26:00.756Z" },
+    { url = "https://files.pythonhosted.org/packages/9d/11/8a2ea753c68d4fece29d5d7c6f3f903948cc6e82d1823bc9f7f7c0355db3/fastuuid-0.14.0-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:4edc56b877d960b4eda2c4232f953a61490c3134da94f3c28af129fb9c62a4f6", size = 460955, upload-time = "2025-10-19T22:36:25.196Z" },
+    { url = "https://files.pythonhosted.org/packages/23/42/7a32c93b6ce12642d9a152ee4753a078f372c9ebb893bc489d838dd4afd5/fastuuid-0.14.0-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:bcc96ee819c282e7c09b2eed2b9bd13084e3b749fdb2faf58c318d498df2efbe", size = 480763, upload-time = "2025-10-19T22:24:28.451Z" },
+    { url = "https://files.pythonhosted.org/packages/b9/e9/a5f6f686b46e3ed4ed3b93770111c233baac87dd6586a411b4988018ef1d/fastuuid-0.14.0-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:7a3c0bca61eacc1843ea97b288d6789fbad7400d16db24e36a66c28c268cfe3d", size = 452613, upload-time = "2025-10-19T22:25:06.827Z" },
+    { url = "https://files.pythonhosted.org/packages/b4/c9/18abc73c9c5b7fc0e476c1733b678783b2e8a35b0be9babd423571d44e98/fastuuid-0.14.0-cp310-cp310-win32.whl", hash = "sha256:7f2f3efade4937fae4e77efae1af571902263de7b78a0aee1a1653795a093b2a", size = 155045, upload-time = "2025-10-19T22:28:32.732Z" },
+    { url = "https://files.pythonhosted.org/packages/5e/8a/d9e33f4eb4d4f6d9f2c5c7d7e96b5cdbb535c93f3b1ad6acce97ee9d4bf8/fastuuid-0.14.0-cp310-cp310-win_amd64.whl", hash = "sha256:ae64ba730d179f439b0736208b4c279b8bc9c089b102aec23f86512ea458c8a4", size = 156122, upload-time = "2025-10-19T22:23:15.59Z" },
+    { url = "https://files.pythonhosted.org/packages/98/f3/12481bda4e5b6d3e698fbf525df4443cc7dce746f246b86b6fcb2fba1844/fastuuid-0.14.0-cp311-cp311-macosx_10_12_x86_64.macosx_11_0_arm64.macosx_10_12_universal2.whl", hash = "sha256:73946cb950c8caf65127d4e9a325e2b6be0442a224fd51ba3b6ac44e1912ce34", size = 516386, upload-time = "2025-10-19T22:42:40.176Z" },
+    { url = "https://files.pythonhosted.org/packages/59/19/2fc58a1446e4d72b655648eb0879b04e88ed6fa70d474efcf550f640f6ec/fastuuid-0.14.0-cp311-cp311-macosx_10_12_x86_64.whl", hash = "sha256:12ac85024637586a5b69645e7ed986f7535106ed3013640a393a03e461740cb7", size = 264569, upload-time = "2025-10-19T22:25:50.977Z" },
+    { url = "https://files.pythonhosted.org/packages/78/29/3c74756e5b02c40cfcc8b1d8b5bac4edbd532b55917a6bcc9113550e99d1/fastuuid-0.14.0-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:05a8dde1f395e0c9b4be515b7a521403d1e8349443e7641761af07c7ad1624b1", size = 254366, upload-time = "2025-10-19T22:29:49.166Z" },
+    { url = "https://files.pythonhosted.org/packages/52/96/d761da3fccfa84f0f353ce6e3eb8b7f76b3aa21fd25e1b00a19f9c80a063/fastuuid-0.14.0-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:09378a05020e3e4883dfdab438926f31fea15fd17604908f3d39cbeb22a0b4dc", size = 278978, upload-time = "2025-10-19T22:35:41.306Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/c2/f84c90167cc7765cb82b3ff7808057608b21c14a38531845d933a4637307/fastuuid-0.14.0-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:bbb0c4b15d66b435d2538f3827f05e44e2baafcc003dd7d8472dc67807ab8fd8", size = 279692, upload-time = "2025-10-19T22:25:36.997Z" },
+    { url = "https://files.pythonhosted.org/packages/af/7b/4bacd03897b88c12348e7bd77943bac32ccf80ff98100598fcff74f75f2e/fastuuid-0.14.0-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:cd5a7f648d4365b41dbf0e38fe8da4884e57bed4e77c83598e076ac0c93995e7", size = 303384, upload-time = "2025-10-19T22:29:46.578Z" },
+    { url = "https://files.pythonhosted.org/packages/c0/a2/584f2c29641df8bd810d00c1f21d408c12e9ad0c0dafdb8b7b29e5ddf787/fastuuid-0.14.0-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:c0a94245afae4d7af8c43b3159d5e3934c53f47140be0be624b96acd672ceb73", size = 460921, upload-time = "2025-10-19T22:36:42.006Z" },
+    { url = "https://files.pythonhosted.org/packages/24/68/c6b77443bb7764c760e211002c8638c0c7cce11cb584927e723215ba1398/fastuuid-0.14.0-cp311-cp311-musllinux_1_1_i686.whl", hash = "sha256:2b29e23c97e77c3a9514d70ce343571e469098ac7f5a269320a0f0b3e193ab36", size = 480575, upload-time = "2025-10-19T22:28:18.975Z" },
+    { url = "https://files.pythonhosted.org/packages/5a/87/93f553111b33f9bb83145be12868c3c475bf8ea87c107063d01377cc0e8e/fastuuid-0.14.0-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:1e690d48f923c253f28151b3a6b4e335f2b06bf669c68a02665bc150b7839e94", size = 452317, upload-time = "2025-10-19T22:25:32.75Z" },
+    { url = "https://files.pythonhosted.org/packages/9e/8c/a04d486ca55b5abb7eaa65b39df8d891b7b1635b22db2163734dc273579a/fastuuid-0.14.0-cp311-cp311-win32.whl", hash = "sha256:a6f46790d59ab38c6aa0e35c681c0484b50dc0acf9e2679c005d61e019313c24", size = 154804, upload-time = "2025-10-19T22:24:15.615Z" },
+    { url = "https://files.pythonhosted.org/packages/9c/b2/2d40bf00820de94b9280366a122cbaa60090c8cf59e89ac3938cf5d75895/fastuuid-0.14.0-cp311-cp311-win_amd64.whl", hash = "sha256:e150eab56c95dc9e3fefc234a0eedb342fac433dacc273cd4d150a5b0871e1fa", size = 156099, upload-time = "2025-10-19T22:24:31.646Z" },
+    { url = "https://files.pythonhosted.org/packages/02/a2/e78fcc5df65467f0d207661b7ef86c5b7ac62eea337c0c0fcedbeee6fb13/fastuuid-0.14.0-cp312-cp312-macosx_10_12_x86_64.macosx_11_0_arm64.macosx_10_12_universal2.whl", hash = "sha256:77e94728324b63660ebf8adb27055e92d2e4611645bf12ed9d88d30486471d0a", size = 510164, upload-time = "2025-10-19T22:31:45.635Z" },
+    { url = "https://files.pythonhosted.org/packages/2b/b3/c846f933f22f581f558ee63f81f29fa924acd971ce903dab1a9b6701816e/fastuuid-0.14.0-cp312-cp312-macosx_10_12_x86_64.whl", hash = "sha256:caa1f14d2102cb8d353096bc6ef6c13b2c81f347e6ab9d6fbd48b9dea41c153d", size = 261837, upload-time = "2025-10-19T22:38:38.53Z" },
+    { url = "https://files.pythonhosted.org/packages/54/ea/682551030f8c4fa9a769d9825570ad28c0c71e30cf34020b85c1f7ee7382/fastuuid-0.14.0-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:d23ef06f9e67163be38cece704170486715b177f6baae338110983f99a72c070", size = 251370, upload-time = "2025-10-19T22:40:26.07Z" },
+    { url = "https://files.pythonhosted.org/packages/14/dd/5927f0a523d8e6a76b70968e6004966ee7df30322f5fc9b6cdfb0276646a/fastuuid-0.14.0-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:0c9ec605ace243b6dbe3bd27ebdd5d33b00d8d1d3f580b39fdd15cd96fd71796", size = 277766, upload-time = "2025-10-19T22:37:23.779Z" },
+    { url = "https://files.pythonhosted.org/packages/16/6e/c0fb547eef61293153348f12e0f75a06abb322664b34a1573a7760501336/fastuuid-0.14.0-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:808527f2407f58a76c916d6aa15d58692a4a019fdf8d4c32ac7ff303b7d7af09", size = 278105, upload-time = "2025-10-19T22:26:56.821Z" },
+    { url = "https://files.pythonhosted.org/packages/2d/b1/b9c75e03b768f61cf2e84ee193dc18601aeaf89a4684b20f2f0e9f52b62c/fastuuid-0.14.0-cp312-cp312-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:2fb3c0d7fef6674bbeacdd6dbd386924a7b60b26de849266d1ff6602937675c8", size = 301564, upload-time = "2025-10-19T22:30:31.604Z" },
+    { url = "https://files.pythonhosted.org/packages/fc/fa/f7395fdac07c7a54f18f801744573707321ca0cee082e638e36452355a9d/fastuuid-0.14.0-cp312-cp312-musllinux_1_1_aarch64.whl", hash = "sha256:ab3f5d36e4393e628a4df337c2c039069344db5f4b9d2a3c9cea48284f1dd741", size = 459659, upload-time = "2025-10-19T22:31:32.341Z" },
+    { url = "https://files.pythonhosted.org/packages/66/49/c9fd06a4a0b1f0f048aacb6599e7d96e5d6bc6fa680ed0d46bf111929d1b/fastuuid-0.14.0-cp312-cp312-musllinux_1_1_i686.whl", hash = "sha256:b9a0ca4f03b7e0b01425281ffd44e99d360e15c895f1907ca105854ed85e2057", size = 478430, upload-time = "2025-10-19T22:26:22.962Z" },
+    { url = "https://files.pythonhosted.org/packages/be/9c/909e8c95b494e8e140e8be6165d5fc3f61fdc46198c1554df7b3e1764471/fastuuid-0.14.0-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:3acdf655684cc09e60fb7e4cf524e8f42ea760031945aa8086c7eae2eeeabeb8", size = 450894, upload-time = "2025-10-19T22:27:01.647Z" },
+    { url = "https://files.pythonhosted.org/packages/90/eb/d29d17521976e673c55ef7f210d4cdd72091a9ec6755d0fd4710d9b3c871/fastuuid-0.14.0-cp312-cp312-win32.whl", hash = "sha256:9579618be6280700ae36ac42c3efd157049fe4dd40ca49b021280481c78c3176", size = 154374, upload-time = "2025-10-19T22:29:19.879Z" },
+    { url = "https://files.pythonhosted.org/packages/cc/fc/f5c799a6ea6d877faec0472d0b27c079b47c86b1cdc577720a5386483b36/fastuuid-0.14.0-cp312-cp312-win_amd64.whl", hash = "sha256:d9e4332dc4ba054434a9594cbfaf7823b57993d7d8e7267831c3e059857cf397", size = 156550, upload-time = "2025-10-19T22:27:49.658Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/83/ae12dd39b9a39b55d7f90abb8971f1a5f3c321fd72d5aa83f90dc67fe9ed/fastuuid-0.14.0-cp313-cp313-macosx_10_12_x86_64.macosx_11_0_arm64.macosx_10_12_universal2.whl", hash = "sha256:77a09cb7427e7af74c594e409f7731a0cf887221de2f698e1ca0ebf0f3139021", size = 510720, upload-time = "2025-10-19T22:42:34.633Z" },
+    { url = "https://files.pythonhosted.org/packages/53/b0/a4b03ff5d00f563cc7546b933c28cb3f2a07344b2aec5834e874f7d44143/fastuuid-0.14.0-cp313-cp313-macosx_10_12_x86_64.whl", hash = "sha256:9bd57289daf7b153bfa3e8013446aa144ce5e8c825e9e366d455155ede5ea2dc", size = 262024, upload-time = "2025-10-19T22:30:25.482Z" },
+    { url = "https://files.pythonhosted.org/packages/9c/6d/64aee0a0f6a58eeabadd582e55d0d7d70258ffdd01d093b30c53d668303b/fastuuid-0.14.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:ac60fc860cdf3c3f327374db87ab8e064c86566ca8c49d2e30df15eda1b0c2d5", size = 251679, upload-time = "2025-10-19T22:36:14.096Z" },
+    { url = "https://files.pythonhosted.org/packages/60/f5/a7e9cda8369e4f7919d36552db9b2ae21db7915083bc6336f1b0082c8b2e/fastuuid-0.14.0-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ab32f74bd56565b186f036e33129da77db8be09178cd2f5206a5d4035fb2a23f", size = 277862, upload-time = "2025-10-19T22:36:23.302Z" },
+    { url = "https://files.pythonhosted.org/packages/f0/d3/8ce11827c783affffd5bd4d6378b28eb6cc6d2ddf41474006b8d62e7448e/fastuuid-0.14.0-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:33e678459cf4addaedd9936bbb038e35b3f6b2061330fd8f2f6a1d80414c0f87", size = 278278, upload-time = "2025-10-19T22:29:43.809Z" },
+    { url = "https://files.pythonhosted.org/packages/a2/51/680fb6352d0bbade04036da46264a8001f74b7484e2fd1f4da9e3db1c666/fastuuid-0.14.0-cp313-cp313-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1e3cc56742f76cd25ecb98e4b82a25f978ccffba02e4bdce8aba857b6d85d87b", size = 301788, upload-time = "2025-10-19T22:36:06.825Z" },
+    { url = "https://files.pythonhosted.org/packages/fa/7c/2014b5785bd8ebdab04ec857635ebd84d5ee4950186a577db9eff0fb8ff6/fastuuid-0.14.0-cp313-cp313-musllinux_1_1_aarch64.whl", hash = "sha256:cb9a030f609194b679e1660f7e32733b7a0f332d519c5d5a6a0a580991290022", size = 459819, upload-time = "2025-10-19T22:35:31.623Z" },
+    { url = "https://files.pythonhosted.org/packages/01/d2/524d4ceeba9160e7a9bc2ea3e8f4ccf1ad78f3bde34090ca0c51f09a5e91/fastuuid-0.14.0-cp313-cp313-musllinux_1_1_i686.whl", hash = "sha256:09098762aad4f8da3a888eb9ae01c84430c907a297b97166b8abc07b640f2995", size = 478546, upload-time = "2025-10-19T22:26:03.023Z" },
+    { url = "https://files.pythonhosted.org/packages/bc/17/354d04951ce114bf4afc78e27a18cfbd6ee319ab1829c2d5fb5e94063ac6/fastuuid-0.14.0-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:1383fff584fa249b16329a059c68ad45d030d5a4b70fb7c73a08d98fd53bcdab", size = 450921, upload-time = "2025-10-19T22:31:02.151Z" },
+    { url = "https://files.pythonhosted.org/packages/fb/be/d7be8670151d16d88f15bb121c5b66cdb5ea6a0c2a362d0dcf30276ade53/fastuuid-0.14.0-cp313-cp313-win32.whl", hash = "sha256:a0809f8cc5731c066c909047f9a314d5f536c871a7a22e815cc4967c110ac9ad", size = 154559, upload-time = "2025-10-19T22:36:36.011Z" },
+    { url = "https://files.pythonhosted.org/packages/22/1d/5573ef3624ceb7abf4a46073d3554e37191c868abc3aecd5289a72f9810a/fastuuid-0.14.0-cp313-cp313-win_amd64.whl", hash = "sha256:0df14e92e7ad3276327631c9e7cec09e32572ce82089c55cb1bb8df71cf394ed", size = 156539, upload-time = "2025-10-19T22:33:35.898Z" },
+    { url = "https://files.pythonhosted.org/packages/16/c9/8c7660d1fe3862e3f8acabd9be7fc9ad71eb270f1c65cce9a2b7a31329ab/fastuuid-0.14.0-cp314-cp314-macosx_10_12_x86_64.macosx_11_0_arm64.macosx_10_12_universal2.whl", hash = "sha256:b852a870a61cfc26c884af205d502881a2e59cc07076b60ab4a951cc0c94d1ad", size = 510600, upload-time = "2025-10-19T22:43:44.17Z" },
+    { url = "https://files.pythonhosted.org/packages/4c/f4/a989c82f9a90d0ad995aa957b3e572ebef163c5299823b4027986f133dfb/fastuuid-0.14.0-cp314-cp314-macosx_10_12_x86_64.whl", hash = "sha256:c7502d6f54cd08024c3ea9b3514e2d6f190feb2f46e6dbcd3747882264bb5f7b", size = 262069, upload-time = "2025-10-19T22:43:38.38Z" },
+    { url = "https://files.pythonhosted.org/packages/da/6c/a1a24f73574ac995482b1326cf7ab41301af0fabaa3e37eeb6b3df00e6e2/fastuuid-0.14.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:1ca61b592120cf314cfd66e662a5b54a578c5a15b26305e1b8b618a6f22df714", size = 251543, upload-time = "2025-10-19T22:32:22.537Z" },
+    { url = "https://files.pythonhosted.org/packages/1a/20/2a9b59185ba7a6c7b37808431477c2d739fcbdabbf63e00243e37bd6bf49/fastuuid-0.14.0-cp314-cp314-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:aa75b6657ec129d0abded3bec745e6f7ab642e6dba3a5272a68247e85f5f316f", size = 277798, upload-time = "2025-10-19T22:33:53.821Z" },
+    { url = "https://files.pythonhosted.org/packages/ef/33/4105ca574f6ded0af6a797d39add041bcfb468a1255fbbe82fcb6f592da2/fastuuid-0.14.0-cp314-cp314-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a8a0dfea3972200f72d4c7df02c8ac70bad1bb4c58d7e0ec1e6f341679073a7f", size = 278283, upload-time = "2025-10-19T22:29:02.812Z" },
+    { url = "https://files.pythonhosted.org/packages/fe/8c/fca59f8e21c4deb013f574eae05723737ddb1d2937ce87cb2a5d20992dc3/fastuuid-0.14.0-cp314-cp314-manylinux_2_5_i686.manylinux1_i686.whl", hash = "sha256:1bf539a7a95f35b419f9ad105d5a8a35036df35fdafae48fb2fd2e5f318f0d75", size = 301627, upload-time = "2025-10-19T22:35:54.985Z" },
+    { url = "https://files.pythonhosted.org/packages/cb/e2/f78c271b909c034d429218f2798ca4e89eeda7983f4257d7865976ddbb6c/fastuuid-0.14.0-cp314-cp314-musllinux_1_1_aarch64.whl", hash = "sha256:9a133bf9cc78fdbd1179cb58a59ad0100aa32d8675508150f3658814aeefeaa4", size = 459778, upload-time = "2025-10-19T22:28:00.999Z" },
+    { url = "https://files.pythonhosted.org/packages/1e/f0/5ff209d865897667a2ff3e7a572267a9ced8f7313919f6d6043aed8b1caa/fastuuid-0.14.0-cp314-cp314-musllinux_1_1_i686.whl", hash = "sha256:f54d5b36c56a2d5e1a31e73b950b28a0d83eb0c37b91d10408875a5a29494bad", size = 478605, upload-time = "2025-10-19T22:36:21.764Z" },
+    { url = "https://files.pythonhosted.org/packages/e0/c8/2ce1c78f983a2c4987ea865d9516dbdfb141a120fd3abb977ae6f02ba7ca/fastuuid-0.14.0-cp314-cp314-musllinux_1_1_x86_64.whl", hash = "sha256:ec27778c6ca3393ef662e2762dba8af13f4ec1aaa32d08d77f71f2a70ae9feb8", size = 450837, upload-time = "2025-10-19T22:34:37.178Z" },
+    { url = "https://files.pythonhosted.org/packages/df/60/dad662ec9a33b4a5fe44f60699258da64172c39bd041da2994422cdc40fe/fastuuid-0.14.0-cp314-cp314-win32.whl", hash = "sha256:e23fc6a83f112de4be0cc1990e5b127c27663ae43f866353166f87df58e73d06", size = 154532, upload-time = "2025-10-19T22:35:18.217Z" },
+    { url = "https://files.pythonhosted.org/packages/1f/f6/da4db31001e854025ffd26bc9ba0740a9cbba2c3259695f7c5834908b336/fastuuid-0.14.0-cp314-cp314-win_amd64.whl", hash = "sha256:df61342889d0f5e7a32f7284e55ef95103f2110fee433c2ae7c2c0956d76ac8a", size = 156457, upload-time = "2025-10-19T22:33:44.579Z" },
+]
+
 [[package]]
 name = "filelock"
 version = "3.18.0"
@@ -819,6 +894,7 @@ dependencies = [
     { name = "posthog" },
     { name = "pydantic" },
     { name = "python-dotenv" },
+    { name = "pyyaml" },
     { name = "tenacity" },
 ]
 
@@ -864,6 +940,9 @@ groq = [
     { name = "groq" },
 ]
 kuzu = [
     { name = "kuzu" },
 ]
+litellm = [
+    { name = "litellm" },
+]
 neo4j-opensearch = [
     { name = "boto3" },
     { name = "opensearch-py" },
 ]
@@ -909,6 +988,7 @@ requires-dist = [
     { name = "langchain-openai", marker = "extra == 'dev'", specifier = ">=0.2.6" },
     { name = "langgraph", marker = "extra == 'dev'", specifier = ">=0.2.15" },
     { name = "langsmith", marker = "extra == 'dev'", specifier = ">=0.1.108" },
+    { name = "litellm", marker = "extra == 'litellm'", specifier = ">=1.52.0" },
     { name = "neo4j", specifier = ">=5.26.0" },
     { name = "numpy", specifier = ">=1.0.0" },
     { name = "openai", specifier = ">=1.91.0" },
@@ -925,6 +1005,7 @@ requires-dist = [
     { name = "pytest-asyncio", marker = "extra == 'dev'", specifier = ">=0.24.0" },
     { name = "pytest-xdist", marker = "extra == 'dev'", specifier = ">=3.6.1" },
     { name = "python-dotenv", specifier = ">=1.0.1" },
+    { name = "pyyaml", specifier = ">=6.0.0" },
     { name = "ruff", marker = "extra == 'dev'", specifier = ">=0.7.1" },
     { name = "sentence-transformers", marker = "extra == 'dev'", specifier = ">=3.2.1" },
     { name = "sentence-transformers", marker = "extra == 'sentence-transformers'", specifier = ">=3.2.1" },
@@ -933,7 +1014,7 @@ requires-dist = [
     { name = "voyageai", marker = "extra == 'dev'", specifier = ">=0.2.3" },
     { name = "voyageai", marker = "extra == 'voyageai'", specifier = ">=0.2.3" },
 ]
-provides-extras = ["anthropic", "groq", "google-genai", "kuzu", "falkordb", "voyageai", "neo4j-opensearch", "sentence-transformers", "neptune", "tracing", "dev"]
+provides-extras = ["anthropic", "groq", "google-genai", "kuzu", "falkordb", "voyageai", "neo4j-opensearch", "sentence-transformers", "neptune", "tracing", "litellm", "dev"]
 
 [[package]]
 name = "groq"
@@ -952,6 +1033,50 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a2/0b/ef7a92ec5ec23a7012975ed59ca3cef541d50a9f0d2dea947fe2723d011f/groq-0.29.0-py3-none-any.whl", hash = "sha256:03515ec46be1ef1feef0cd9d876b6f30a39ee2742e76516153d84acd7c97f23a", size = 130814, upload-time = "2025-06-25T23:40:10.391Z" },
 ]
 
+[[package]]
+name = "grpcio"
+version = "1.67.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/20/53/d9282a66a5db45981499190b77790570617a604a38f3d103d0400974aeb5/grpcio-1.67.1.tar.gz", hash = "sha256:3dc2ed4cabea4dc14d5e708c2b426205956077cc5de419b4d4079315017e9732", size = 12580022, upload-time = "2024-10-29T06:30:07.787Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/4e/cd/f6ca5c49aa0ae7bc6d0757f7dae6f789569e9490a635eaabe02bc02de7dc/grpcio-1.67.1-cp310-cp310-linux_armv7l.whl", hash = "sha256:8b0341d66a57f8a3119b77ab32207072be60c9bf79760fa609c5609f2deb1f3f", size = 5112450, upload-time = "2024-10-29T06:23:38.202Z" },
+    { url = "https://files.pythonhosted.org/packages/d4/f0/d9bbb4a83cbee22f738ee7a74aa41e09ccfb2dcea2cc30ebe8dab5b21771/grpcio-1.67.1-cp310-cp310-macosx_12_0_universal2.whl", hash = "sha256:f5a27dddefe0e2357d3e617b9079b4bfdc91341a91565111a21ed6ebbc51b22d", size = 10937518, upload-time = "2024-10-29T06:23:43.535Z" },
+    { url = "https://files.pythonhosted.org/packages/5b/17/0c5dbae3af548eb76669887642b5f24b232b021afe77eb42e22bc8951d9c/grpcio-1.67.1-cp310-cp310-manylinux_2_17_aarch64.whl", hash = "sha256:43112046864317498a33bdc4797ae6a268c36345a910de9b9c17159d8346602f", size = 5633610, upload-time = "2024-10-29T06:23:47.168Z" },
+    { url = "https://files.pythonhosted.org/packages/17/48/e000614e00153d7b2760dcd9526b95d72f5cfe473b988e78f0ff3b472f6c/grpcio-1.67.1-cp310-cp310-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:c9b929f13677b10f63124c1a410994a401cdd85214ad83ab67cc077fc7e480f0", size = 6240678, upload-time = "2024-10-29T06:23:49.352Z" },
+    { url = "https://files.pythonhosted.org/packages/64/19/a16762a70eeb8ddfe43283ce434d1499c1c409ceec0c646f783883084478/grpcio-1.67.1-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:e7d1797a8a3845437d327145959a2c0c47c05947c9eef5ff1a4c80e499dcc6fa", size = 5884528, upload-time = "2024-10-29T06:23:52.345Z" },
+    { url = "https://files.pythonhosted.org/packages/6b/dc/bd016aa3684914acd2c0c7fa4953b2a11583c2b844f3d7bae91fa9b98fbb/grpcio-1.67.1-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:0489063974d1452436139501bf6b180f63d4977223ee87488fe36858c5725292", size = 6583680, upload-time = "2024-10-29T06:23:55.074Z" },
+    { url = "https://files.pythonhosted.org/packages/1a/93/1441cb14c874f11aa798a816d582f9da82194b6677f0f134ea53d2d5dbeb/grpcio-1.67.1-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:9fd042de4a82e3e7aca44008ee2fb5da01b3e5adb316348c21980f7f58adc311", size = 6162967, upload-time = "2024-10-29T06:23:57.286Z" },
+    { url = "https://files.pythonhosted.org/packages/29/e9/9295090380fb4339b7e935b9d005fa9936dd573a22d147c9e5bb2df1b8d4/grpcio-1.67.1-cp310-cp310-win32.whl", hash = "sha256:638354e698fd0c6c76b04540a850bf1db27b4d2515a19fcd5cf645c48d3eb1ed", size = 3616336, upload-time = "2024-10-29T06:23:59.69Z" },
+    { url = "https://files.pythonhosted.org/packages/ce/de/7c783b8cb8f02c667ca075c49680c4aeb8b054bc69784bcb3e7c1bbf4985/grpcio-1.67.1-cp310-cp310-win_amd64.whl", hash = "sha256:608d87d1bdabf9e2868b12338cd38a79969eaf920c89d698ead08f48de9c0f9e", size = 4352071, upload-time = "2024-10-29T06:24:02.477Z" },
+    { url = "https://files.pythonhosted.org/packages/59/2c/b60d6ea1f63a20a8d09c6db95c4f9a16497913fb3048ce0990ed81aeeca0/grpcio-1.67.1-cp311-cp311-linux_armv7l.whl", hash = "sha256:7818c0454027ae3384235a65210bbf5464bd715450e30a3d40385453a85a70cb", size = 5119075, upload-time = "2024-10-29T06:24:04.696Z" },
+    { url = "https://files.pythonhosted.org/packages/b3/9a/e1956f7ca582a22dd1f17b9e26fcb8229051b0ce6d33b47227824772feec/grpcio-1.67.1-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:ea33986b70f83844cd00814cee4451055cd8cab36f00ac64a31f5bb09b31919e", size = 11009159, upload-time = "2024-10-29T06:24:07.781Z" },
+    { url = "https://files.pythonhosted.org/packages/43/a8/35fbbba580c4adb1d40d12e244cf9f7c74a379073c0a0ca9d1b5338675a1/grpcio-1.67.1-cp311-cp311-manylinux_2_17_aarch64.whl", hash = "sha256:c7a01337407dd89005527623a4a72c5c8e2894d22bead0895306b23c6695698f", size = 5629476, upload-time = "2024-10-29T06:24:11.444Z" },
+    { url = "https://files.pythonhosted.org/packages/77/c9/864d336e167263d14dfccb4dbfa7fce634d45775609895287189a03f1fc3/grpcio-1.67.1-cp311-cp311-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:80b866f73224b0634f4312a4674c1be21b2b4afa73cb20953cbbb73a6b36c3cc", size = 6239901, upload-time = "2024-10-29T06:24:14.2Z" },
+    { url = "https://files.pythonhosted.org/packages/f7/1e/0011408ebabf9bd69f4f87cc1515cbfe2094e5a32316f8714a75fd8ddfcb/grpcio-1.67.1-cp311-cp311-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f9fff78ba10d4250bfc07a01bd6254a6d87dc67f9627adece85c0b2ed754fa96", size = 5881010, upload-time = "2024-10-29T06:24:17.451Z" },
+    { url = "https://files.pythonhosted.org/packages/b4/7d/fbca85ee9123fb296d4eff8df566f458d738186d0067dec6f0aa2fd79d71/grpcio-1.67.1-cp311-cp311-musllinux_1_1_i686.whl", hash = "sha256:8a23cbcc5bb11ea7dc6163078be36c065db68d915c24f5faa4f872c573bb400f", size = 6580706, upload-time = "2024-10-29T06:24:20.038Z" },
+    { url = "https://files.pythonhosted.org/packages/75/7a/766149dcfa2dfa81835bf7df623944c1f636a15fcb9b6138ebe29baf0bc6/grpcio-1.67.1-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:1a65b503d008f066e994f34f456e0647e5ceb34cfcec5ad180b1b44020ad4970", size = 6161799, upload-time = "2024-10-29T06:24:22.604Z" },
+    { url = "https://files.pythonhosted.org/packages/09/13/5b75ae88810aaea19e846f5380611837de411181df51fd7a7d10cb178dcb/grpcio-1.67.1-cp311-cp311-win32.whl", hash = "sha256:e29ca27bec8e163dca0c98084040edec3bc49afd10f18b412f483cc68c712744", size = 3616330, upload-time = "2024-10-29T06:24:25.775Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/39/38117259613f68f072778c9638a61579c0cfa5678c2558706b10dd1d11d3/grpcio-1.67.1-cp311-cp311-win_amd64.whl", hash = "sha256:786a5b18544622bfb1e25cc08402bd44ea83edfb04b93798d85dca4d1a0b5be5", size = 4354535, upload-time = "2024-10-29T06:24:28.614Z" },
+    { url = "https://files.pythonhosted.org/packages/6e/25/6f95bd18d5f506364379eabc0d5874873cc7dbdaf0757df8d1e82bc07a88/grpcio-1.67.1-cp312-cp312-linux_armv7l.whl", hash = "sha256:267d1745894200e4c604958da5f856da6293f063327cb049a51fe67348e4f953", size = 5089809, upload-time = "2024-10-29T06:24:31.24Z" },
+    { url = "https://files.pythonhosted.org/packages/10/3f/d79e32e5d0354be33a12db2267c66d3cfeff700dd5ccdd09fd44a3ff4fb6/grpcio-1.67.1-cp312-cp312-macosx_10_9_universal2.whl", hash = "sha256:85f69fdc1d28ce7cff8de3f9c67db2b0ca9ba4449644488c1e0303c146135ddb", size = 10981985, upload-time = "2024-10-29T06:24:34.942Z" },
+    { url = "https://files.pythonhosted.org/packages/21/f2/36fbc14b3542e3a1c20fb98bd60c4732c55a44e374a4eb68f91f28f14aab/grpcio-1.67.1-cp312-cp312-manylinux_2_17_aarch64.whl", hash = "sha256:f26b0b547eb8d00e195274cdfc63ce64c8fc2d3e2d00b12bf468ece41a0423a0", size = 5588770, upload-time = "2024-10-29T06:24:38.145Z" },
+    { url = "https://files.pythonhosted.org/packages/0d/af/bbc1305df60c4e65de8c12820a942b5e37f9cf684ef5e49a63fbb1476a73/grpcio-1.67.1-cp312-cp312-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:4422581cdc628f77302270ff839a44f4c24fdc57887dc2a45b7e53d8fc2376af", size = 6214476, upload-time = "2024-10-29T06:24:41.006Z" },
+    { url = "https://files.pythonhosted.org/packages/92/cf/1d4c3e93efa93223e06a5c83ac27e32935f998bc368e276ef858b8883154/grpcio-1.67.1-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:1d7616d2ded471231c701489190379e0c311ee0a6c756f3c03e6a62b95a7146e", size = 5850129, upload-time = "2024-10-29T06:24:43.553Z" },
+    { url = "https://files.pythonhosted.org/packages/ae/ca/26195b66cb253ac4d5ef59846e354d335c9581dba891624011da0e95d67b/grpcio-1.67.1-cp312-cp312-musllinux_1_1_i686.whl", hash = "sha256:8a00efecde9d6fcc3ab00c13f816313c040a28450e5e25739c24f432fc6d3c75", size = 6568489, upload-time = "2024-10-29T06:24:46.453Z" },
+    { url = "https://files.pythonhosted.org/packages/d1/94/16550ad6b3f13b96f0856ee5dfc2554efac28539ee84a51d7b14526da985/grpcio-1.67.1-cp312-cp312-musllinux_1_1_x86_64.whl", hash = "sha256:699e964923b70f3101393710793289e42845791ea07565654ada0969522d0a38", size = 6149369, upload-time = "2024-10-29T06:24:49.112Z" },
+    { url = "https://files.pythonhosted.org/packages/33/0d/4c3b2587e8ad7f121b597329e6c2620374fccbc2e4e1aa3c73ccc670fde4/grpcio-1.67.1-cp312-cp312-win32.whl", hash = "sha256:4e7b904484a634a0fff132958dabdb10d63e0927398273917da3ee103e8d1f78", size = 3599176, upload-time = "2024-10-29T06:24:51.443Z" },
+    { url = "https://files.pythonhosted.org/packages/7d/36/0c03e2d80db69e2472cf81c6123aa7d14741de7cf790117291a703ae6ae1/grpcio-1.67.1-cp312-cp312-win_amd64.whl", hash = "sha256:5721e66a594a6c4204458004852719b38f3d5522082be9061d6510b455c90afc", size = 4346574, upload-time = "2024-10-29T06:24:54.587Z" },
+    { url = "https://files.pythonhosted.org/packages/12/d2/2f032b7a153c7723ea3dea08bffa4bcaca9e0e5bdf643ce565b76da87461/grpcio-1.67.1-cp313-cp313-linux_armv7l.whl", hash = "sha256:aa0162e56fd10a5547fac8774c4899fc3e18c1aa4a4759d0ce2cd00d3696ea6b", size = 5091487, upload-time = "2024-10-29T06:24:57.416Z" },
+    { url = "https://files.pythonhosted.org/packages/d0/ae/ea2ff6bd2475a082eb97db1104a903cf5fc57c88c87c10b3c3f41a184fc0/grpcio-1.67.1-cp313-cp313-macosx_10_13_universal2.whl", hash = "sha256:beee96c8c0b1a75d556fe57b92b58b4347c77a65781ee2ac749d550f2a365dc1", size = 10943530, upload-time = "2024-10-29T06:25:01.062Z" },
+    { url = "https://files.pythonhosted.org/packages/07/62/646be83d1a78edf8d69b56647327c9afc223e3140a744c59b25fbb279c3b/grpcio-1.67.1-cp313-cp313-manylinux_2_17_aarch64.whl", hash = "sha256:a93deda571a1bf94ec1f6fcda2872dad3ae538700d94dc283c672a3b508ba3af", size = 5589079, upload-time = "2024-10-29T06:25:04.254Z" },
+    { url = "https://files.pythonhosted.org/packages/d0/25/71513d0a1b2072ce80d7f5909a93596b7ed10348b2ea4fdcbad23f6017bf/grpcio-1.67.1-cp313-cp313-manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:0e6f255980afef598a9e64a24efce87b625e3e3c80a45162d111a461a9f92955", size = 6213542, upload-time = "2024-10-29T06:25:06.824Z" },
+    { url = "https://files.pythonhosted.org/packages/76/9a/d21236297111052dcb5dc85cd77dc7bf25ba67a0f55ae028b2af19a704bc/grpcio-1.67.1-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:9e838cad2176ebd5d4a8bb03955138d6589ce9e2ce5d51c3ada34396dbd2dba8", size = 5850211, upload-time = "2024-10-29T06:25:10.149Z" },
+    { url = "https://files.pythonhosted.org/packages/2d/fe/70b1da9037f5055be14f359026c238821b9bcf6ca38a8d760f59a589aacd/grpcio-1.67.1-cp313-cp313-musllinux_1_1_i686.whl", hash = "sha256:a6703916c43b1d468d0756c8077b12017a9fcb6a1ef13faf49e67d20d7ebda62", size = 6572129, upload-time = "2024-10-29T06:25:12.853Z" },
+    { url = "https://files.pythonhosted.org/packages/74/0d/7df509a2cd2a54814598caf2fb759f3e0b93764431ff410f2175a6efb9e4/grpcio-1.67.1-cp313-cp313-musllinux_1_1_x86_64.whl", hash = "sha256:917e8d8994eed1d86b907ba2a61b9f0aef27a2155bca6cbb322430fc7135b7bb", size = 6149819, upload-time = "2024-10-29T06:25:15.803Z" },
+    { url = "https://files.pythonhosted.org/packages/0a/08/bc3b0155600898fd10f16b79054e1cca6cb644fa3c250c0fe59385df5e6f/grpcio-1.67.1-cp313-cp313-win32.whl", hash = "sha256:e279330bef1744040db8fc432becc8a727b84f456ab62b744d3fdb83f327e121", size = 3596561, upload-time = "2024-10-29T06:25:19.348Z" },
+    { url = "https://files.pythonhosted.org/packages/5a/96/44759eca966720d0f3e1b105c43f8ad4590c97bf8eb3cd489656e9590baa/grpcio-1.67.1-cp313-cp313-win_amd64.whl", hash = "sha256:fa0c739ad8b1996bd24823950e3cb5152ae91fca1c09cc791190bf1627ffefba", size = 4346042, upload-time = "2024-10-29T06:25:21.939Z" },
+]
+
 [[package]]
 name = "h11"
 version = "0.16.0"
@@ -1516,7 +1641,7 @@ wheels = [
 
 [[package]]
 name = "langchain-core"
-version = "0.3.72"
+version = "0.3.80"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "jsonpatch" },
@@ -1527,23 +1652,23 @@ dependencies = [
     { name = "tenacity" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/8b/49/7568baeb96a57d3218cb5f1f113b142063679088fd3a0d0cae1feb0b3d36/langchain_core-0.3.72.tar.gz", hash = "sha256:4de3828909b3d7910c313242ab07b241294650f5cb6eac17738dd3638b1cd7de", size = 567227, upload-time = "2025-07-24T00:40:08.5Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/49/49/f76647b7ba1a6f9c11b0343056ab4d3e5fc445981d205237fed882b2ad60/langchain_core-0.3.80.tar.gz", hash = "sha256:29636b82513ab49e834764d023c4d18554d3d719a185d37b019d0a8ae948c6bb", size = 583629, upload-time = "2025-11-19T22:23:18.771Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/6e/7d/9f75023c478e3b854d67da31d721e39f0eb30ae969ec6e755430cb1c0fb5/langchain_core-0.3.72-py3-none-any.whl", hash = "sha256:9fa15d390600eb6b6544397a7aa84be9564939b6adf7a2b091179ea30405b240", size = 442806, upload-time = "2025-07-24T00:40:06.994Z" },
+    { url = "https://files.pythonhosted.org/packages/da/e8/e7a090ebe37f2b071c64e81b99fb1273b3151ae932f560bb94c22f191cde/langchain_core-0.3.80-py3-none-any.whl", hash = "sha256:2141e3838d100d17dce2359f561ec0df52c526bae0de6d4f469f8026c5747456", size = 450786, upload-time = "2025-11-19T22:23:17.133Z" },
 ]
 
 [[package]]
 name = "langchain-openai"
-version = "0.3.27"
+version = "0.3.35"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "langchain-core" },
     { name = "openai" },
     { name = "tiktoken" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/6f/7b/e65261a08a03dd43f0ef8a539930b56548ac8136e71258c220d3589d1d07/langchain_openai-0.3.27.tar.gz", hash = "sha256:5d5a55adbff739274dfc3a4102925771736f893758f63679b64ae62fed79ca30", size = 753326, upload-time = "2025-06-27T17:56:29.904Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/fb/96/06d0d25a37e05a0ff2d918f0a4b0bf0732aed6a43b472b0b68426ce04ef8/langchain_openai-0.3.35.tar.gz", hash = "sha256:fa985fd041c3809da256a040c98e8a43e91c6d165b96dcfeb770d8bd457bf76f", size = 786635, upload-time = "2025-10-06T15:09:28.463Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/aa/31/1f0baf6490b082bf4d06f355c5e9c28728931dbf321f3ca03137617a692e/langchain_openai-0.3.27-py3-none-any.whl", hash = "sha256:efe636c3523978c44adc41cf55c8b3766c05c77547982465884d1258afe705df", size = 70368, upload-time = "2025-06-27T17:56:28.726Z" },
+    { url = "https://files.pythonhosted.org/packages/d8/d5/c90c5478215c20ee71d8feaf676f7ffd78d0568f8c98bd83f81ce7562ed7/langchain_openai-0.3.35-py3-none-any.whl", hash = "sha256:76d5707e6e81fd461d33964ad618bd326cb661a1975cef7c1cb0703576bdada5", size = 75952, upload-time = "2025-10-06T15:09:27.137Z" },
 ]
@@ -1620,6 +1745,30 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/1d/33/a3337eb70d795495a299a1640d7a75f17fb917155a64309b96106e7b9452/langsmith-0.4.4-py3-none-any.whl", hash = "sha256:014c68329bd085bd6c770a6405c61bb6881f82eb554ce8c4d1984b0035fd1716", size = 367687, upload-time = "2025-06-27T19:20:33.839Z" },
 ]
 
+[[package]]
+name = "litellm"
+version = "1.80.7"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "aiohttp" },
+    { name = "click" },
+    { name = "fastuuid" },
+    { name = "grpcio" },
+    { name = "httpx" },
+    { name = "importlib-metadata" },
+    { name = "jinja2" },
+    { name = "jsonschema" },
+    { name = "openai" },
+    { name = "pydantic" },
+    { name = "python-dotenv" },
+    { name = "tiktoken" },
+    { name = "tokenizers" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/a5/3f/af532014449c3931ae6cad2d97d267dd43d0de006060a8cbf0962e004024/litellm-1.80.7.tar.gz", hash = "sha256:3977a8d195aef842d01c18bf9e22984829363c6a4b54daf9a43c9dd9f190b42c", size = 12023127, upload-time = "2025-11-27T23:03:52.474Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/54/e0/2e60a0c09235fd7b55297390c557923f3c35a9cf001914222c26a7857d2b/litellm-1.80.7-py3-none-any.whl", hash = "sha256:f7d993f78c1e0e4e1202b2a925cc6540b55b6e5fb055dd342d88b145ab3102ed", size = 10848321, upload-time = "2025-11-27T23:03:50.002Z" },
+]
+
 [[package]]
 name = "markupsafe"
 version = "3.0.2"
@@ -2157,7 +2306,7 @@ wheels = [
 
 [[package]]
 name = "openai"
-version = "1.95.0"
+version = "2.8.1"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anyio" },
@@ -2169,9 +2318,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/ef/2f/0c6f509a1585545962bfa6e201d7fb658eb2a6f52fb8c26765632d91706c/openai-1.95.0.tar.gz", hash = "sha256:54bc42df9f7142312647dd485d34cca5df20af825fa64a30ca55164be2cf4cc9", size = 488144, upload-time = "2025-07-10T18:35:49.946Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/d5/e4/42591e356f1d53c568418dc7e30dcda7be31dd5a4d570bca22acb0525862/openai-2.8.1.tar.gz", hash = "sha256:cb1b79eef6e809f6da326a7ef6038719e35aa944c42d081807bfa1be8060f15f", size = 602490, upload-time = "2025-11-17T22:39:59.549Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/19/a5/57d0bb58b938a3e3f352ff26e645da1660436402a6ad1b29780d261cc5a5/openai-1.95.0-py3-none-any.whl", hash = "sha256:a7afc9dca7e7d616371842af8ea6dbfbcb739a85d183f5f664ab1cc311b9ef18", size = 755572, upload-time = "2025-07-10T18:35:47.507Z" },
+    { url = "https://files.pythonhosted.org/packages/55/4f/dbc0c124c40cb390508a82770fb9f6e3ed162560181a85089191a851c59a/openai-2.8.1-py3-none-any.whl", hash = "sha256:c6c3b5a04994734386e8dad3c00a393f56d3b68a27cd2e8acae91a59e4122463", size = 1022688, upload-time = "2025-11-17T22:39:57.675Z" },
 ]
 
 [[package]]