Skip to content

Commit

Permalink
Disable timeouts and set max replicas to 10 (the maximum we get for free)
Browse files Browse the repository at this point in the history
  • Loading branch information
KastanDay committed Feb 22, 2024
1 parent aa70cc5 commit 316b1bd
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions ai_ta_backend/beam/ingest.py
Original file line number Diff line number Diff line change
Expand Up @@ -138,11 +138,11 @@ def loader():


# autoscaler = RequestLatencyAutoscaler(desired_latency=30, max_replicas=2)
autoscaler = QueueDepthAutoscaler(max_tasks_per_replica=30, max_replicas=3)
autoscaler = QueueDepthAutoscaler(max_tasks_per_replica=30, max_replicas=10)


# Triggers determine how your app is deployed
@app.rest_api(max_pending_tasks=10_000, max_retries=3, loader=loader, autoscaler=autoscaler)
@app.rest_api(max_pending_tasks=10_000, max_retries=3, loader=loader, autoscaler=autoscaler, timeout=-1)
def ingest(**inputs: Dict[str, Any]):
qdrant_client, vectorstore, s3_client, supabase_client, posthog = inputs["context"]

Expand Down

0 comments on commit 316b1bd

Please sign in to comment.