fix: address gold-standard review findings

saschabuehrle · saschabuehrle · commit 405fc4528752 · 2026-03-08T16:38:45.000+01:00
Critical:
- Remove rich from requirements.txt (now optional in pyproject.toml)
- Fix stale tiers=DEFAULT_TIERS warning messages referencing removed param
- Complete @xenova/transformers → @huggingface/transformers migration
  across all TS packages, docs, examples, and CI config
- Revert workspace:* → workspace:^ (preserves semver on publish)

Security:
- Use hmac.compare_digest for constant-time auth token comparison
- Guard record() with _lock: state writes, counter snapshot, and trace append now run under the lock

Quality:
- Preserve _LazyModule.__name__ alias after dict merge
- Add __bool__ returning False to _MissingIntegration for truthiness compat
- Fix CHANGELOG import time to match actual measurement (~20ms)
- Fix import ordering (ruff I001)
diff --git a/.github/models.yml b/.github/models.yml
@@ -47,7 +47,7 @@ ml_models:
 
     installation:
       python: "pip install fastembed"
-      typescript: "npm install @xenova/transformers"
+      typescript: "npm install @huggingface/transformers"
 
 # Heuristic Models (No ML Required)
 heuristic_models:
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -33,7 +33,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ### Changed
 
-- **Lazy imports** — `import cascadeflow` no longer eagerly loads all providers, numpy, or heavyweight submodules. Import time reduced from ~1900ms to <200ms.
+- **Lazy imports** — `import cascadeflow` no longer eagerly loads all providers, numpy, or heavyweight submodules. Import time reduced from ~1900ms to ~20ms via PEP 562 lazy loading.
 - **`__all__` reduced** — From 127 to ~20 essential public symbols. Non-essential exports remain accessible but are not star-exported.
 - **`rich` moved to optional** — No longer a core dependency; falls back to stdlib logging when not installed. Install with `pip install cascadeflow[rich]`.
 - **Integration import errors** — Failed optional integration imports now return proxy objects that raise `ImportError` with install hints on use, instead of silently returning `None`.
diff --git a/README.md b/README.md
@@ -289,7 +289,7 @@ For advanced quality validation, enable ML-based semantic similarity checking to
 **Step 1:** Install the optional ML packages:
 
 ```bash
-npm install @cascadeflow/ml @xenova/transformers
+npm install @cascadeflow/ml @huggingface/transformers
 ```
 
 **Step 2:** Enable semantic validation in your cascade:
diff --git a/cascadeflow/__init__.py b/cascadeflow/__init__.py
@@ -46,8 +46,10 @@ def _load(self):
         if not self.__loaded:
             import importlib
 
+            alias = self.__name__
             real = importlib.import_module(self.__real_name)
             self.__dict__.update(real.__dict__)
+            self.__name__ = alias  # preserve alias name after dict merge
             self.__loaded = True
 
     def __getattr__(self, name: str):
diff --git a/cascadeflow/agent.py b/cascadeflow/agent.py
@@ -974,7 +974,7 @@ async def run(
             logger.warning(
                 f"user_tier='{user_tier}' specified but no tiers configured. "
                 f"Ignoring tier parameter. To use tiers, initialize agent with: "
-                f"CascadeAgent(models=[...], tiers=DEFAULT_TIERS)"
+                f"HarnessConfig with tier-based rules"
             )
 
         workflow_profile = None
@@ -1402,7 +1402,7 @@ async def run_streaming(
             logger.warning(
                 f"user_tier='{user_tier}' specified but no tiers configured. "
                 f"Ignoring tier parameter. To use tiers, initialize agent with: "
-                f"CascadeAgent(models=[...], tiers=DEFAULT_TIERS)"
+                f"HarnessConfig with tier-based rules"
             )
 
         workflow_profile = None
@@ -1681,7 +1681,7 @@ async def stream_events(
             logger.warning(
                 f"user_tier='{user_tier}' specified but no tiers configured. "
                 f"Ignoring tier parameter. To use tiers, initialize agent with: "
-                f"CascadeAgent(models=[...], tiers=DEFAULT_TIERS)"
+                f"HarnessConfig with tier-based rules"
             )
 
         workflow_profile = None
diff --git a/cascadeflow/harness/api.py b/cascadeflow/harness/api.py
@@ -187,30 +187,31 @@ def record(
             _sanitize_trace_value(model, max_length=_MAX_MODEL_LEN) if model is not None else None
         )
 
-        self.last_action = safe_action
-        self.model_used = safe_model
-        entry: dict[str, Any] = {
-            "action": safe_action,
-            "reason": safe_reason,
-            "model": safe_model,
-            "run_id": self.run_id,
-            "mode": self.mode,
-            "step": self.step_count,
-            "timestamp_ms": time.time() * 1000,
-            "tool_calls_total": self.tool_calls,
-            "cost_total": self.cost,
-            "latency_used_ms": self.latency_used_ms,
-            "energy_used": self.energy_used,
-            "budget_state": {
-                "max": self.budget_max,
-                "remaining": self.budget_remaining,
-            },
-        }
-        if applied is not None:
-            entry["applied"] = applied
-        if decision_mode is not None:
-            entry["decision_mode"] = decision_mode
-        self._trace.append(entry)
+        with self._lock:
+            self.last_action = safe_action
+            self.model_used = safe_model
+            entry: dict[str, Any] = {
+                "action": safe_action,
+                "reason": safe_reason,
+                "model": safe_model,
+                "run_id": self.run_id,
+                "mode": self.mode,
+                "step": self.step_count,
+                "timestamp_ms": time.time() * 1000,
+                "tool_calls_total": self.tool_calls,
+                "cost_total": self.cost,
+                "latency_used_ms": self.latency_used_ms,
+                "energy_used": self.energy_used,
+                "budget_state": {
+                    "max": self.budget_max,
+                    "remaining": self.budget_remaining,
+                },
+            }
+            if applied is not None:
+                entry["applied"] = applied
+            if decision_mode is not None:
+                entry["decision_mode"] = decision_mode
+            self._trace.append(entry)
         _emit_harness_decision(entry)
 
 
diff --git a/cascadeflow/integrations/__init__.py b/cascadeflow/integrations/__init__.py
@@ -39,6 +39,9 @@ def __call__(self, *args, **kwargs):
     def __getattr__(self, name: str):
         self._fail()
 
+    def __bool__(self):
+        return False
+
     def __repr__(self):
         return f"<MissingIntegration {self._name!r}>"
 
diff --git a/cascadeflow/proxy/server.py b/cascadeflow/proxy/server.py
@@ -24,6 +24,7 @@
 
 import asyncio
 import hashlib
+import hmac
 import inspect
 import json
 import os
@@ -619,7 +620,8 @@ def _check_auth(self, proxy: RoutingProxy) -> bool:
         if not token:
             return True
         auth = self.headers.get("Authorization", "")
-        if auth == f"Bearer {token}":
+        expected = f"Bearer {token}"
+        if hmac.compare_digest(auth, expected):
             return True
         self.send_response(401)
         self.send_header("Content-Type", "application/json")
diff --git a/cascadeflow/routing/tier_routing.py b/cascadeflow/routing/tier_routing.py
@@ -2,16 +2,12 @@
 Tier-aware routing for user tier management.
 
 This module provides tier-based model filtering and budget enforcement.
-It's OPTIONAL - only activated when users provide 'tiers' parameter.
+It's OPTIONAL - only activated when tier rules are configured via HarnessConfig.
 
 Usage:
     >>> from cascadeflow import CascadeAgent
-    >>> from cascadeflow.schema.config import DEFAULT_TIERS
     >>>
-    >>> # OPTIONAL: Enable tier routing
-    >>> agent = CascadeAgent(models=[...], tiers=DEFAULT_TIERS)
-    >>>
-    >>> # Use tier-aware routing
+    >>> # Tier-aware routing; assumes `agent` was initialized with tier-based HarnessConfig rules
     >>> result = await agent.run("query", user_tier="free")
     >>>
     >>> # Or ignore tiers - works without them
diff --git a/docs/guides/custom_validation.md b/docs/guides/custom_validation.md
@@ -904,7 +904,7 @@ if (await checker.isAvailable()) {
 
 **Installation:**
 ```bash
-npm install @cascadeflow/ml @xenova/transformers
+npm install @cascadeflow/ml @huggingface/transformers
 ```
 
 ---
diff --git a/packages/core/examples/README.md b/packages/core/examples/README.md
@@ -251,7 +251,7 @@ ML-based semantic validation using embeddings.
 
 **Installation:**
 ```bash
-npm install @cascadeflow/ml @xenova/transformers
+npm install @cascadeflow/ml @huggingface/transformers
 ```
 
 **Example:**
@@ -406,7 +406,7 @@ npx tsx production-patterns.ts
 npm install @cascadeflow/core
 
 # For semantic quality example
-npm install @cascadeflow/ml @xenova/transformers
+npm install @cascadeflow/ml @huggingface/transformers
 
 # Install peer dependencies for providers you'll use
 npm install openai                    # OpenAI
@@ -568,7 +568,7 @@ npm install @cascadeflow/core
 npm install openai @anthropic-ai/sdk groq-sdk
 
 # For semantic quality
-npm install @cascadeflow/ml @xenova/transformers
+npm install @cascadeflow/ml @huggingface/transformers
 ```
 </details>
 
diff --git a/packages/core/examples/nodejs/semantic-quality.ts b/packages/core/examples/nodejs/semantic-quality.ts
@@ -15,11 +15,11 @@
  * Requirements:
  *     - @cascadeflow/core
  *     - @cascadeflow/ml (for embeddings)
- *     - @xenova/transformers (ONNX runtime for embeddings)
+ *     - @huggingface/transformers (ONNX runtime for embeddings)
  *     - OpenAI API key
  *
  * Setup:
- *     npm install @cascadeflow/core @cascadeflow/ml @xenova/transformers
+ *     npm install @cascadeflow/core @cascadeflow/ml @huggingface/transformers
  *     export OPENAI_API_KEY="your-key-here"
  *     npx tsx semantic-quality.ts
  *
@@ -79,7 +79,7 @@ async function main() {
     console.log('❌ ML dependencies not available!');
     console.log();
     console.log('To use semantic validation, install:');
-    console.log('   npm install @cascadeflow/ml @xenova/transformers');
+    console.log('   npm install @cascadeflow/ml @huggingface/transformers');
     console.log();
     console.log('The BGE-small-en-v1.5 model (~40MB) will auto-download on first use.');
     console.log();
diff --git a/packages/core/package.json b/packages/core/package.json
@@ -63,7 +63,7 @@
   "peerDependencies": {
     "@anthropic-ai/sdk": "^0.30.0",
     "@huggingface/inference": "^2.8.0",
-    "@xenova/transformers": "^2.17.2",
+    "@huggingface/transformers": "^3.0.0",
     "groq-sdk": "^0.5.0",
     "openai": "^4.0.0"
   },
@@ -80,7 +80,7 @@
     "@huggingface/inference": {
       "optional": true
     },
-    "@xenova/transformers": {
+    "@huggingface/transformers": {
       "optional": true
     }
   },
diff --git a/packages/core/src/quality-semantic.ts b/packages/core/src/quality-semantic.ts
@@ -64,7 +64,7 @@ export interface SemanticQualityResult {
  * not installed.
  *
  * Installation:
- *   npm install @cascadeflow/ml @xenova/transformers
+ *   npm install @cascadeflow/ml @huggingface/transformers
  *
  * The embedding model (~40MB) will auto-download on first use.
  */
@@ -137,7 +137,7 @@ export class SemanticQualityChecker {
       const err = error as { code?: string; message?: string };
       if (err?.code === 'ERR_MODULE_NOT_FOUND' || err?.message?.includes('Cannot find module')) {
         console.warn(
-          '@cascadeflow/ml not available. Install with: npm install @cascadeflow/ml @xenova/transformers'
+          '@cascadeflow/ml not available. Install with: npm install @cascadeflow/ml @huggingface/transformers'
         );
       } else {
         const message = error instanceof Error ? error.message : String(error);
diff --git a/packages/langchain-cascadeflow/package.json b/packages/langchain-cascadeflow/package.json
@@ -48,8 +48,8 @@
     "typescript"
   ],
   "dependencies": {
-    "@cascadeflow/core": "workspace:*",
-    "@cascadeflow/ml": "workspace:*",
+    "@cascadeflow/core": "workspace:^",
+    "@cascadeflow/ml": "workspace:^",
     "@langchain/anthropic": "^1.3.13",
     "@langchain/google-genai": "^1.0.3"
   },
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
diff --git a/requirements.txt b/requirements.txt