diff --git a/signal_engine/extract/backends.py b/signal_engine/extract/backends.py index b80b073..83ad2b2 100644 --- a/signal_engine/extract/backends.py +++ b/signal_engine/extract/backends.py @@ -50,6 +50,10 @@ class GeminiBackend: temperature=0, max_output_tokens=max_tokens, response_mime_type="application/json", + # Gemini 2.5 thinks by default and spends the output budget on reasoning tokens — + # it hit MAX_TOKENS with ~3.8k thoughts and a truncated JSON body (0 claims parsed). + # Extraction is deterministic, no-CoT (mirrors the local path's enable_thinking=False). + thinking_config=types.ThinkingConfig(thinking_budget=0), ), ) return resp.text or "{}"