Increase Ollama request timeout to handle slow cloud models

- Set timeout to 300 seconds (5 minutes) for total request
- Set connect timeout to 60 seconds
- This fixes httpx.ReadTimeout errors with Ollama cloud models
- Cloud models may take longer to respond than local instances
parent 0cb155b5
......@@ -251,7 +251,9 @@ class AnthropicProviderHandler(BaseProviderHandler):
class OllamaProviderHandler(BaseProviderHandler):
def __init__(self, provider_id: str, api_key: Optional[str] = None):
    """Initialize the Ollama handler with a long-timeout async HTTP client.

    Args:
        provider_id: Key into ``config.providers`` whose ``endpoint`` is used
            as the client's base URL.
        api_key: Optional API key forwarded to the base handler.
    """
    super().__init__(provider_id, api_key)
    # Cloud-hosted Ollama models can take far longer to respond than local
    # instances; a generous read timeout prevents httpx.ReadTimeout errors.
    # 300 s total request budget, 60 s to establish the connection.
    timeout = httpx.Timeout(300.0, connect=60.0)
    # Build the client exactly once, with the timeout applied — creating a
    # default-timeout client first and then rebinding self.client would leak
    # the first AsyncClient (it is never closed).
    self.client = httpx.AsyncClient(
        base_url=config.providers[provider_id].endpoint,
        timeout=timeout,
    )
async def handle_request(self, model: str, messages: List[Dict], max_tokens: Optional[int] = None,
temperature: Optional[float] = 1.0, stream: Optional[bool] = False) -> Dict:
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment