v1.0 - Version stable : multi-PC, détection UI-DETR-1, 3 modes d'exécution
- Frontend v4 accessible sur réseau local (192.168.1.40) - Ports ouverts: 3002 (frontend), 5001 (backend), 5004 (dashboard) - Ollama GPU fonctionnel - Self-healing interactif - Dashboard confiance Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
This commit is contained in:
145
examples/test_ollama_integration.py
Normal file
145
examples/test_ollama_integration.py
Normal file
@@ -0,0 +1,145 @@
|
||||
"""
|
||||
Script de test pour l'intégration Ollama avec UIDetector
|
||||
|
||||
Ce script montre comment utiliser le UIDetector avec Ollama pour
|
||||
détecter et classifier des éléments UI dans des screenshots.
|
||||
"""
|
||||
|
||||
import sys
|
||||
from pathlib import Path
|
||||
|
||||
# Ajouter le répertoire parent au path
|
||||
sys.path.insert(0, str(Path(__file__).parent.parent))
|
||||
|
||||
from core.detection import (
|
||||
UIDetector,
|
||||
DetectionConfig,
|
||||
OllamaClient,
|
||||
check_ollama_available
|
||||
)
|
||||
|
||||
|
||||
def test_ollama_connection():
    """Check that the local Ollama server is reachable.

    Prints the list of locally installed models on success, or
    installation instructions on failure.

    Returns:
        bool: True when Ollama responds, False otherwise.
    """
    banner = "=" * 60
    print(banner)
    print("Test 1: Vérification de la connexion Ollama")
    print(banner)

    # Guard clause: bail out early with install hints when the server is down.
    if not check_ollama_available():
        print("❌ Ollama n'est pas disponible")
        print("\nPour installer Ollama:")
        print("1. Visitez: https://ollama.ai")
        print("2. Téléchargez et installez Ollama")
        # NOTE(review): this suggests pulling qwen2.5-vl while test 2 below
        # uses qwen3-vl:8b — confirm which model the project standardizes on.
        print("3. Lancez: ollama pull qwen2.5-vl")
        print("4. Vérifiez: ollama list")
        return False

    print("✅ Ollama est disponible!")

    # Enumerate the models installed on this machine.
    models = OllamaClient().list_models()
    print(f"\nModèles disponibles: {models}")
    return True
|
||||
|
||||
|
||||
def test_ui_detector_with_ollama(screenshot_path: str):
    """Run UI-element detection on a screenshot via an Ollama-backed VLM.

    Args:
        screenshot_path: Path to the screenshot image to analyze.
    """
    separator = "=" * 60
    print("\n" + separator)
    print("Test 2: Détection UI avec Ollama")
    print(separator)

    # Wire an Ollama VLM client into a freshly configured UIDetector.
    vlm = OllamaClient(model="qwen3-vl:8b")
    detector = UIDetector(
        DetectionConfig(
            vlm_model="qwen3-vl:8b",
            confidence_threshold=0.7,
            detect_regions=True,
        )
    )
    detector.set_vlm_client(vlm)

    # Run detection on the provided screenshot.
    print(f"\nAnalyse du screenshot: {screenshot_path}")
    found = detector.detect(screenshot_path)

    # Report every detected element with its position, label and confidence.
    print(f"\n✅ {len(found)} éléments UI détectés:")
    for idx, item in enumerate(found, 1):
        print(f"\n  {idx}. {item.type.upper()} - {item.role}")
        print(f"     Position: {item.bbox}")
        print(f"     Label: {item.label}")
        print(f"     Confiance: {item.confidence:.2f}")
|
||||
|
||||
|
||||
def test_element_classification():
    """Classify the type and role of a synthetic UI element image.

    Builds a small solid-blue image (stand-in for a button) and asks the
    Ollama client to classify its type, then its role.
    """
    separator = "=" * 60
    print("\n" + separator)
    print("Test 3: Classification d'éléments")
    print(separator)

    # NOTE(review): uses qwen2.5-vl here while test 2 uses qwen3-vl:8b —
    # confirm the intended model.
    client = OllamaClient(model="qwen2.5-vl")

    # Local imports: only needed for this synthetic-image test.
    import numpy as np
    from PIL import Image

    # Synthesize a 150x50 solid-blue rectangle as a fake "button".
    pixels = np.zeros((50, 150, 3), dtype=np.uint8)
    pixels[:, :] = [0, 100, 200]  # Bleu
    fake_button = Image.fromarray(pixels)

    # Step 1: classify the element type.
    print("\nClassification du type...")
    type_res = client.classify_element_type(fake_button)
    if not type_res["success"]:
        print("❌ Échec de classification")
    else:
        print(f"✅ Type: {type_res['type']} (confiance: {type_res['confidence']:.2f})")

    # Step 2: classify the element role, assuming it is a button.
    print("\nClassification du rôle...")
    role_res = client.classify_element_role(fake_button, "button")
    if not role_res["success"]:
        print("❌ Échec de classification")
    else:
        print(f"✅ Rôle: {role_res['role']} (confiance: {role_res['confidence']:.2f})")
|
||||
|
||||
|
||||
def main():
    """Entry point: run the three Ollama integration tests in order.

    Test 1 (connectivity) gates the rest; test 2 (UI detection) runs only
    when a screenshot path is supplied on the command line; test 3
    (classification) always runs when Ollama is available.
    """
    separator = "=" * 60
    print("\n" + separator)
    print("TEST D'INTÉGRATION OLLAMA + UIDetector")
    print(separator)

    # Test 1: abort everything if the Ollama server is unreachable.
    if not test_ollama_connection():
        print("\n⚠️ Ollama n'est pas disponible. Tests limités.")
        return

    # Test 2: UI detection, only when a screenshot path was given as argv[1].
    if len(sys.argv) <= 1:
        print("\n💡 Pour tester la détection UI:")
        print("   python test_ollama_integration.py <chemin_screenshot>")
    else:
        candidate = sys.argv[1]
        if Path(candidate).exists():
            test_ui_detector_with_ollama(candidate)
        else:
            print(f"\n❌ Screenshot non trouvé: {candidate}")

    # Test 3: element classification on a synthetic image.
    test_element_classification()

    print("\n" + separator)
    print("Tests terminés!")
    print(separator)
|
||||
|
||||
|
||||
# Script entry point: run the integration tests when executed directly.
if __name__ == "__main__":
    main()
|
||||
Reference in New Issue
Block a user