From 203e5cc6c1a79459311d7955efe10a0b5e6e9f7f Mon Sep 17 00:00:00 2001
From: Dom
Date: Tue, 21 Apr 2026 10:16:27 +0200
Subject: [PATCH] =?UTF-8?q?fix(grounding):=20d=C3=A9sactiver=20orchestrate?=
 =?UTF-8?q?ur=20VRAM=20pendant=20ex=C3=A9cution=20+=20qwen2.5vl:3b=20pour?=
 =?UTF-8?q?=20description?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

L'orchestrateur VRAM redémarrait Ollama en pleine exécution → timeout.
Désactivé pendant le workflow. L'orchestrateur reste disponible pour
bascule manuelle avant/après.

Description ancre via qwen2.5vl:3b (3 Go) au lieu de 7b — tient en VRAM
sans décharger CLIP ni RF-DETR.

Co-Authored-By: Claude Opus 4.6 (1M context)
---
 core/execution/input_handler.py | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/core/execution/input_handler.py b/core/execution/input_handler.py
index c262edbfe..9eff35955 100644
--- a/core/execution/input_handler.py
+++ b/core/execution/input_handler.py
@@ -286,10 +286,6 @@ Si tu vois un dialogue ou une popup, indique quel bouton cliquer.
 Si l'écran est normal sans action nécessaire, réponds action="nothing".
 Réponds UNIQUEMENT le JSON, pas d'explication."""
 
-    from core.cognition.vram_orchestrator import get_orchestrator
-    orch = get_orchestrator()
-    orch.ensure_reasoning_ready()
-
     ollama_url = os.environ.get("OLLAMA_URL", "http://localhost:11434")
     model = os.environ.get("RPA_REASONING_MODEL", "qwen2.5vl:7b")
 
@@ -402,8 +398,9 @@ def _describe_anchor_image(anchor_image_base64: str) -> Optional[str]:
             anchor_image_base64 = anchor_image_base64.split(',', 1)[1]
 
         ollama_url = os.environ.get("OLLAMA_URL", "http://localhost:11434")
-        model = os.environ.get("RPA_REASONING_MODEL", "qwen2.5vl:7b")
+        model = "qwen2.5vl:3b"
 
+        logger.info(f"[Grounding] Description ancre via {model}...")
         response = requests.post(
             f"{ollama_url}/api/generate",
             json={
@@ -413,7 +410,7 @@ def _describe_anchor_image(anchor_image_base64: str) -> Optional[str]:
                 "stream": False,
                 "options": {"temperature": 0.1, "num_predict": 20}
             },
-            timeout=15
+            timeout=30
         )
 
         if response.status_code == 200: