Skip to content

Commit deefede

Browse files
authored
Merge pull request #165 from ridgesai/hobbleabbas-patch-7
Increase load balancing for glm4.5fp8 to targon
2 parents 3c8c32c + 598c6c3 commit deefede

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

proxy/providers/inference_manager.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -38,7 +38,7 @@ def _find_provider(self, model: str) -> InferenceProvider:
 38  38   if (
 39  39   self.targon.supports_model(model)
 40  40   and self.targon.is_available()
 41     - and random.random() < 0.25
     41 + and random.random() < 0.5
 42  42   ):
 43  43   return self.targon
 44  44
@@ -153,4 +153,4 @@ async def inference(
153 153   return {"error": f"{primary_provider.name} error: {response_text} | {fallback_provider.name} fallback also failed: {fallback_response}"}
154 154
155 155   # No fallback available or model doesn't support fallback
156     - return {"error": f"Error in inference request: {response_text}"}
    156 + return {"error": f"Error in inference request: {response_text}"}

0 commit comments

Comments
 (0)