feat(cache): ScreenStateCache clé composite context-aware (Lot D)

Avant : clé = phash seul -> deux contextes différents avec même screenshot partageaient la même entrée cache -> collisions silencieuses. Après : clé composite {phash}|{md5(ctx)[:16]} avec ctx = - window_title - app_name - enable_ocr - enable_ui_detection - workflow_id (isolation inter-workflows) get_or_compute() kwargs-only. TTL 2s et éviction LRU inchangés. invalidate_if_changed() continue de comparer uniquement les phash. ExecutionLoop propage tout le contexte au cache. 8 nouveaux tests prouvant : - même image + window différent = miss - même image + app différent = miss - même image + flags différents = miss - même image + workflow_id différent = miss - même image + même contexte = hit Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-04-15 09:06:51 +02:00
parent 9ca277a63f
commit c8a3618e27
2 changed files with 858 additions and 0 deletions
--- a/core/pipeline/screen_state_cache.py
+++ b/core/pipeline/screen_state_cache.py
@@ -0,0 +1,409 @@
+"""
+ScreenStateCache — Cache perceptuel de ScreenState (context-aware).
+
+Objectif : éviter de réanalyser un screenshot identique (5-15s VLM/OCR)
+à chaque step de la boucle d'exécution.
+
+Principe (Lot D — avril 2026) :
+  - Clé = composite de 6 éléments pour éviter les collisions silencieuses
+    entre contextes différents partageant un même screenshot :
+      1. phash (dhash 8x8 du screenshot) — calculé en ~2-5ms
+      2. window_title (titre fenêtre active)
+      3. app_name (nom process actif)
+      4. enable_ocr (flag runtime)
+      5. enable_ui_detection (flag runtime)
+      6. workflow_id (isolation inter-workflows)
+  - TTL par défaut : 2 secondes (configurable)
+  - Invalidation explicite possible (par clé composite ou globale)
+  - invalidate_if_changed reste piloté par le phash seul (détection de
+    changement visuel majeur, indépendant du contexte)
+  - Thread-safe (lock interne)
+
+API principale :
+  >>> cache = ScreenStateCache(ttl_seconds=2.0)
+  >>> state, hit, ms = cache.get_or_compute(
+  ...     screenshot_path, compute_fn,
+  ...     window_title="App", app_name="app.exe",
+  ...     enable_ocr=True, enable_ui_detection=True,
+  ...     workflow_id="wf_123",
+  ... )
+
+La fonction `compute_fn` prend le chemin du screenshot et doit retourner
+un `ScreenState`. Elle n'est appelée qu'en cache miss.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import logging
+import threading
+import time
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Callable, Optional, Tuple
+
+from PIL import Image
+
+from core.models.screen_state import ScreenState
+
+logger = logging.getLogger(__name__)
+
+
+# =============================================================================
+# Hash perceptuel (dhash simple, sans dépendance imagehash)
+# =============================================================================
+
+
+def _hamming_distance_hex(a: str, b: str) -> int:
+    """
+    Distance de Hamming entre deux chaînes hexadécimales de même longueur.
+
+    Retourne le nombre de bits qui diffèrent entre les deux hashes.
+    Si les longueurs diffèrent, on pad à droite par des zéros.
+    """
+    if len(a) != len(b):
+        max_len = max(len(a), len(b))
+        a = a.ljust(max_len, "0")
+        b = b.ljust(max_len, "0")
+    try:
+        xor = int(a, 16) ^ int(b, 16)
+        return bin(xor).count("1")
+    except ValueError:
+        # Fallback : comparaison caractère à caractère
+        return sum(1 for ca, cb in zip(a, b) if ca != cb) * 4
+
+
+def compute_perceptual_hash(screenshot_path: str, size: int = 8) -> str:
+    """
+    Calculer un dhash (difference hash) pour un screenshot.
+
+    Algorithme :
+      1. Convertir en niveaux de gris
+      2. Redimensionner à (size+1) x size
+      3. Comparer chaque pixel avec son voisin de droite (dhash)
+      4. Retourner un hash hexadécimal de size*size bits
+
+    Robuste aux petites variations (curseur, blink, compression).
+    Coût typique : 2-5 ms sur un 1920x1080.
+
+    Args:
+        screenshot_path: Chemin vers le fichier image
+        size: Taille du hash (8 = 64 bits, défaut)
+
+    Returns:
+        Chaîne hexadécimale (size*size/4 caractères)
+    """
+    try:
+        img = Image.open(screenshot_path)
+        img = img.convert("L").resize((size + 1, size), Image.LANCZOS)
+        pixels = list(img.getdata())
+
+        # dhash : comparer chaque pixel avec celui de droite
+        bits = []
+        for row in range(size):
+            for col in range(size):
+                left = pixels[row * (size + 1) + col]
+                right = pixels[row * (size + 1) + col + 1]
+                bits.append(1 if left > right else 0)
+
+        # Convertir en hex
+        value = 0
+        for bit in bits:
+            value = (value << 1) | bit
+        return format(value, f"0{size * size // 4}x")
+    except Exception as e:
+        logger.warning(f"Hash perceptuel échoué pour {screenshot_path}: {e}")
+        # Fallback : hash du contenu brut
+        try:
+            data = Path(screenshot_path).read_bytes()
+            return hashlib.md5(data).hexdigest()[:16]
+        except Exception:
+            return f"unhashable_{int(time.time() * 1000)}"
+
+
+# =============================================================================
+# Clé composite (Lot D)
+# =============================================================================
+
+
+def _make_cache_key(
+    phash: str,
+    window_title: str,
+    app_name: str,
+    enable_ocr: bool,
+    enable_ui_detection: bool,
+    workflow_id: str,
+) -> str:
+    """
+    Construire une clé composite stable pour le cache.
+
+    Combine les 6 dimensions du contexte d'exécution dans une chaîne
+    hexadécimale (md5 tronqué à 16 caractères), préfixée par le phash pour
+    conserver une lisibilité minimale en debug (log : `aabb…|ctx=1234…`).
+
+    NB : On hash plutôt que concaténer brut pour :
+      - Borner la taille de la clé même si window_title est long
+      - Éviter les collisions triviales (séparateur présent dans un titre)
+      - Rendre la clé opaque (pas de PII en clair dans les logs de cache)
+
+    Args:
+        phash: Hash perceptuel du screenshot (dhash 8x8)
+        window_title: Titre de la fenêtre active (str)
+        app_name: Nom du process actif (str)
+        enable_ocr: Flag runtime OCR (bool)
+        enable_ui_detection: Flag runtime détection UI (bool)
+        workflow_id: ID du workflow en cours (str, "" pour legacy)
+
+    Returns:
+        Clé composite `{phash}|{ctx_hash}` où ctx_hash = md5(16)
+    """
+    # Sérialisation déterministe ; `|` comme séparateur interne puisque hashé.
+    ctx_repr = (
+        f"{window_title or ''}\x1f"
+        f"{app_name or ''}\x1f"
+        f"{int(bool(enable_ocr))}\x1f"
+        f"{int(bool(enable_ui_detection))}\x1f"
+        f"{workflow_id or ''}"
+    )
+    ctx_hash = hashlib.md5(ctx_repr.encode("utf-8")).hexdigest()[:16]
+    return f"{phash}|{ctx_hash}"
+
+
+# =============================================================================
+# Entry
+# =============================================================================
+
+
+@dataclass
+class _CacheEntry:
+    state: ScreenState
+    created_at: float
+    phash: str  # phash seul (utilisé par invalidate_if_changed)
+
+
+# =============================================================================
+# Cache
+# =============================================================================
+
+
+class ScreenStateCache:
+    """
+    Cache de ScreenState avec TTL et clé composite context-aware.
+
+    Thread-safe. Utilise un lock interne pour les opérations get/set.
+    """
+
+    def __init__(self, ttl_seconds: float = 2.0, max_entries: int = 16):
+        """
+        Args:
+            ttl_seconds: Durée de vie d'une entrée (en secondes)
+            max_entries: Nombre max d'entrées avant éviction LRU simple
+        """
+        self.ttl_seconds = ttl_seconds
+        self.max_entries = max_entries
+        # Clé = composite (_make_cache_key), valeur = _CacheEntry
+        self._store: dict[str, _CacheEntry] = {}
+        self._lock = threading.Lock()
+
+        # Métriques simples (utile pour le debug / logs)
+        self.hits = 0
+        self.misses = 0
+        self.invalidations = 0
+
+    # -------------------------------------------------------------------------
+    # API bas niveau (par clé composite)
+    # -------------------------------------------------------------------------
+
+    def _get(self, composite_key: str) -> Optional[ScreenState]:
+        """Retourne l'entrée pour cette clé composite si encore valide."""
+        with self._lock:
+            entry = self._store.get(composite_key)
+            if entry is None:
+                return None
+            if time.time() - entry.created_at > self.ttl_seconds:
+                # Expiré
+                self._store.pop(composite_key, None)
+                return None
+            return entry.state
+
+    def _set(self, composite_key: str, phash: str, state: ScreenState) -> None:
+        """Enregistre un état pour cette clé composite."""
+        with self._lock:
+            # Éviction simple : si plein, virer l'entrée la plus ancienne
+            if (
+                len(self._store) >= self.max_entries
+                and composite_key not in self._store
+            ):
+                oldest_key = min(
+                    self._store, key=lambda k: self._store[k].created_at
+                )
+                self._store.pop(oldest_key, None)
+
+            self._store[composite_key] = _CacheEntry(
+                state=state,
+                created_at=time.time(),
+                phash=phash,
+            )
+
+    def invalidate(self, composite_key: Optional[str] = None) -> None:
+        """
+        Invalider une entrée ou tout le cache.
+
+        Args:
+            composite_key: Clé à invalider. Si None, vide tout le cache.
+        """
+        with self._lock:
+            if composite_key is None:
+                self._store.clear()
+            else:
+                self._store.pop(composite_key, None)
+            self.invalidations += 1
+
+    def invalidate_if_changed(
+        self,
+        screenshot_path: str,
+        threshold: float = 0.3,
+    ) -> bool:
+        """
+        Invalider le cache si l'écran a suffisamment changé.
+
+        Compare le dhash du screenshot courant avec le phash (seul) de chaque
+        entrée du cache. La décision est volontairement indépendante du reste
+        de la clé composite : un changement visuel majeur rend toutes les
+        entrées obsolètes, quel que soit le contexte.
+
+        Args:
+            screenshot_path: Chemin du screenshot courant
+            threshold: Proportion de bits qui doivent différer (0.0-1.0).
+                0.3 = 30% (~19 bits sur 64) = changement significatif.
+
+        Returns:
+            True si le cache a été invalidé, False sinon.
+        """
+        if not self._store:
+            return False
+
+        current_phash = compute_perceptual_hash(screenshot_path)
+
+        # Bits totaux : 64 pour un dhash 8x8 standard. On déduit via la
+        # longueur hexa du hash courant pour rester générique.
+        total_bits = len(current_phash) * 4
+        if total_bits == 0:
+            return False
+
+        threshold_bits = threshold * total_bits
+
+        with self._lock:
+            if not self._store:
+                return False
+
+            # Distance de Hamming minimale avec les phashes des entrées
+            # (on regarde entry.phash, pas la clé composite).
+            min_distance = None
+            for entry in self._store.values():
+                distance = _hamming_distance_hex(current_phash, entry.phash)
+                if min_distance is None or distance < min_distance:
+                    min_distance = distance
+
+            if min_distance is not None and min_distance > threshold_bits:
+                size_before = len(self._store)
+                self._store.clear()
+                self.invalidations += 1
+                logger.debug(
+                    f"[ScreenStateCache] invalidate_if_changed: "
+                    f"distance={min_distance}/{total_bits} > "
+                    f"threshold={threshold_bits:.1f} → {size_before} entrées purgées"
+                )
+                return True
+            return False
+
+    # -------------------------------------------------------------------------
+    # API haut niveau (context-aware)
+    # -------------------------------------------------------------------------
+
+    def get_or_compute(
+        self,
+        screenshot_path: str,
+        compute_fn: Callable[[str], ScreenState],
+        *,
+        window_title: str = "",
+        app_name: str = "",
+        enable_ocr: bool = True,
+        enable_ui_detection: bool = True,
+        workflow_id: str = "",
+        force_refresh: bool = False,
+    ) -> Tuple[ScreenState, bool, float]:
+        """
+        Récupérer ou calculer le ScreenState pour un screenshot + contexte.
+
+        Clé de cache = composite(phash, window_title, app_name, enable_ocr,
+        enable_ui_detection, workflow_id). Deux contextes différents partageant
+        le même screenshot n'entrent PAS en collision.
+
+        Rétrocompatibilité : tous les kwargs de contexte ont une valeur par
+        défaut. Un caller legacy qui n'a pas encore été adapté partagera la
+        même entrée de cache qu'un autre caller legacy (comportement antérieur).
+
+        Args:
+            screenshot_path: Chemin du screenshot
+            compute_fn: Fonction qui construit un ScreenState si cache miss
+            window_title: Titre de la fenêtre active (contexte visuel)
+            app_name: Nom du process actif (contexte applicatif)
+            enable_ocr: Flag runtime — différencie états avec/sans OCR
+            enable_ui_detection: Flag runtime — différencie états avec/sans UI
+            workflow_id: ID du workflow — isolation inter-workflows
+            force_refresh: Ignorer le cache et recalculer
+
+        Returns:
+            Tuple (state, cache_hit, elapsed_ms)
+        """
+        t0 = time.time()
+        phash = compute_perceptual_hash(screenshot_path)
+        composite_key = _make_cache_key(
+            phash=phash,
+            window_title=window_title,
+            app_name=app_name,
+            enable_ocr=enable_ocr,
+            enable_ui_detection=enable_ui_detection,
+            workflow_id=workflow_id,
+        )
+
+        if not force_refresh:
+            cached = self._get(composite_key)
+            if cached is not None:
+                self.hits += 1
+                elapsed_ms = (time.time() - t0) * 1000
+                logger.debug(
+                    f"[ScreenStateCache] HIT key={composite_key[:24]}… "
+                    f"({elapsed_ms:.1f}ms)"
+                )
+                return cached, True, elapsed_ms
+
+        # Cache miss → calcul complet
+        self.misses += 1
+        state = compute_fn(screenshot_path)
+        self._set(composite_key, phash, state)
+        elapsed_ms = (time.time() - t0) * 1000
+        logger.debug(
+            f"[ScreenStateCache] MISS key={composite_key[:24]}… "
+            f"({elapsed_ms:.1f}ms)"
+        )
+        return state, False, elapsed_ms
+
+    def stats(self) -> dict:
+        """Retourne les métriques du cache."""
+        with self._lock:
+            total = self.hits + self.misses
+            return {
+                "hits": self.hits,
+                "misses": self.misses,
+                "invalidations": self.invalidations,
+                "hit_rate": self.hits / total if total > 0 else 0.0,
+                "size": len(self._store),
+                "max_entries": self.max_entries,
+                "ttl_seconds": self.ttl_seconds,
+            }
+
+    def __len__(self) -> int:
+        with self._lock:
+            return len(self._store)
--- a/tests/unit/test_screen_state_cache.py
+++ b/tests/unit/test_screen_state_cache.py
@@ -0,0 +1,449 @@
+"""
+Tests unitaires du ScreenStateCache.
+
+Couvre :
+  - Hash perceptuel (déterministe, stable sur même image, différent sur autres)
+  - Cache hit / miss
+  - TTL (expiration)
+  - Invalidation explicite
+  - Éviction LRU
+  - Thread-safety basique
+"""
+
+from __future__ import annotations
+
+import threading
+import time
+from datetime import datetime
+from pathlib import Path
+
+import pytest
+from PIL import Image
+
+from core.models.screen_state import (
+    ContextLevel,
+    EmbeddingRef,
+    PerceptionLevel,
+    RawLevel,
+    ScreenState,
+    WindowContext,
+)
+from core.pipeline.screen_state_cache import (
+    ScreenStateCache,
+    compute_perceptual_hash,
+)
+
+
+# -----------------------------------------------------------------------------
+# Fixtures
+# -----------------------------------------------------------------------------
+
+
+def _make_screenshot(tmp_path: Path, color: tuple, name: str = "shot.png") -> str:
+    img = Image.new("RGB", (320, 240), color=color)
+    path = tmp_path / name
+    img.save(str(path))
+    return str(path)
+
+
+def _make_state(session_id: str = "s1") -> ScreenState:
+    return ScreenState(
+        screen_state_id=f"state_{datetime.now().strftime('%H%M%S%f')}",
+        timestamp=datetime.now(),
+        session_id=session_id,
+        window=WindowContext(
+            app_name="app", window_title="Title", screen_resolution=[1920, 1080]
+        ),
+        raw=RawLevel(screenshot_path="", capture_method="test", file_size_bytes=0),
+        perception=PerceptionLevel(
+            embedding=EmbeddingRef(provider="t", vector_id="v", dimensions=512),
+            detected_text=[],
+            text_detection_method="none",
+            confidence_avg=0.0,
+        ),
+        context=ContextLevel(),
+        ui_elements=[],
+    )
+
+
+# -----------------------------------------------------------------------------
+# Hash perceptuel
+# -----------------------------------------------------------------------------
+
+
+class TestPerceptualHash:
+
+    def test_deterministic_for_same_image(self, tmp_path):
+        path = _make_screenshot(tmp_path, (255, 0, 0))
+        h1 = compute_perceptual_hash(path)
+        h2 = compute_perceptual_hash(path)
+        assert h1 == h2
+        assert len(h1) == 16  # 8*8 bits = 64 bits = 16 hex chars
+
+    def test_differs_across_images(self, tmp_path):
+        path_red = _make_screenshot(tmp_path, (255, 0, 0), "red.png")
+        path_blue = _make_screenshot(tmp_path, (0, 0, 255), "blue.png")
+        # Note : deux images unies ont le même dhash (toutes différences nulles)
+        # On doit utiliser des images avec un vrai gradient pour différer.
+        grad_red = Image.new("RGB", (320, 240))
+        for x in range(320):
+            for y in range(240):
+                grad_red.putpixel((x, y), (x % 256, 0, 0))
+        grad_path = tmp_path / "grad_red.png"
+        grad_red.save(str(grad_path))
+
+        h_red = compute_perceptual_hash(path_red)
+        h_grad = compute_perceptual_hash(str(grad_path))
+        assert h_red != h_grad
+
+    def test_robust_to_missing_file(self, tmp_path):
+        # Chemin inexistant → fallback mais pas de crash
+        h = compute_perceptual_hash(str(tmp_path / "does_not_exist.png"))
+        assert isinstance(h, str)
+        assert len(h) > 0
+
+
+# -----------------------------------------------------------------------------
+# Cache
+# -----------------------------------------------------------------------------
+
+
+class TestScreenStateCache:
+
+    def test_get_or_compute_cache_miss_then_hit(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (100, 100, 100))
+
+        calls = []
+
+        def compute(p):
+            calls.append(p)
+            return _make_state()
+
+        s1, hit1, _ = cache.get_or_compute(path, compute)
+        s2, hit2, _ = cache.get_or_compute(path, compute)
+
+        assert hit1 is False
+        assert hit2 is True
+        assert len(calls) == 1
+        assert s1 is s2  # Même objet retourné
+
+    def test_ttl_expiration(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=0.1)
+        path = _make_screenshot(tmp_path, (50, 50, 50))
+
+        def compute(_):
+            return _make_state()
+
+        cache.get_or_compute(path, compute)
+        time.sleep(0.15)
+        _, hit, _ = cache.get_or_compute(path, compute)
+        assert hit is False  # Expiré
+
+    def test_force_refresh_bypasses_cache(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (10, 10, 10))
+        cache.get_or_compute(path, lambda _: _make_state())
+        _, hit, _ = cache.get_or_compute(
+            path, lambda _: _make_state(), force_refresh=True
+        )
+        assert hit is False
+
+    def test_invalidate_all(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (200, 200, 200))
+        cache.get_or_compute(path, lambda _: _make_state())
+        cache.invalidate()
+        _, hit, _ = cache.get_or_compute(path, lambda _: _make_state())
+        assert hit is False
+
+    def test_eviction_lru(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0, max_entries=2)
+        # Créer 3 images différentes (gradients différents pour hashes différents)
+        paths = []
+        for i, intensity in enumerate([30, 120, 220]):
+            img = Image.new("RGB", (320, 240))
+            for x in range(320):
+                for y in range(240):
+                    img.putpixel((x, y), ((x + intensity) % 256, intensity, 0))
+            p = tmp_path / f"grad_{i}.png"
+            img.save(str(p))
+            paths.append(str(p))
+
+        def compute(_):
+            return _make_state()
+
+        cache.get_or_compute(paths[0], compute)
+        time.sleep(0.01)
+        cache.get_or_compute(paths[1], compute)
+        time.sleep(0.01)
+        cache.get_or_compute(paths[2], compute)
+        # Le 1er doit avoir été évincé
+        assert len(cache) == 2
+
+    def test_stats(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (77, 77, 77))
+        cache.get_or_compute(path, lambda _: _make_state())
+        cache.get_or_compute(path, lambda _: _make_state())
+        stats = cache.stats()
+        assert stats["hits"] == 1
+        assert stats["misses"] == 1
+        assert stats["hit_rate"] == 0.5
+
+    def test_invalidate_if_changed_purges_on_big_change(self, tmp_path):
+        """Un screenshot très différent doit invalider tout le cache."""
+        import random
+
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        # Image 1 : gradient doux
+        img1 = Image.new("RGB", (320, 240))
+        for y in range(240):
+            for x in range(320):
+                img1.putpixel((x, y), (y, y, y))
+        p1 = tmp_path / "v.png"
+        img1.save(str(p1))
+
+        # Image 2 : bruit aléatoire (structure radicalement différente)
+        random.seed(42)
+        img2 = Image.new("RGB", (320, 240))
+        for y in range(240):
+            for x in range(320):
+                v = random.randint(0, 255)
+                img2.putpixel((x, y), (v, v, v))
+        p2 = tmp_path / "noise.png"
+        img2.save(str(p2))
+
+        cache.get_or_compute(str(p1), lambda _: _make_state())
+        assert len(cache) == 1
+
+        purged = cache.invalidate_if_changed(str(p2), threshold=0.3)
+        assert purged is True
+        assert len(cache) == 0
+
+    def test_invalidate_if_changed_keeps_cache_on_small_change(self, tmp_path):
+        """Un screenshot très proche ne doit PAS invalider le cache."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        # Même gradient avec un léger bruit
+        img1 = Image.new("RGB", (320, 240))
+        for y in range(240):
+            for x in range(320):
+                img1.putpixel((x, y), ((x + y) % 256, 0, 0))
+        p1 = tmp_path / "a.png"
+        img1.save(str(p1))
+
+        img2 = img1.copy()
+        # Bruit léger : changer seulement quelques pixels
+        for i in range(5):
+            img2.putpixel((i, 0), (255, 255, 255))
+        p2 = tmp_path / "b.png"
+        img2.save(str(p2))
+
+        cache.get_or_compute(str(p1), lambda _: _make_state())
+        purged = cache.invalidate_if_changed(str(p2), threshold=0.3)
+        assert purged is False
+        assert len(cache) == 1
+
+    def test_invalidate_if_changed_empty_cache_is_noop(self, tmp_path):
+        """Sur cache vide, invalidate_if_changed ne doit rien faire."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        p = _make_screenshot(tmp_path, (100, 100, 100))
+        purged = cache.invalidate_if_changed(p, threshold=0.3)
+        assert purged is False
+
+    def test_thread_safety(self, tmp_path):
+        """Lecture/écriture concurrentes ne doivent pas crasher."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (64, 64, 64))
+        errors = []
+
+        def worker():
+            try:
+                for _ in range(20):
+                    cache.get_or_compute(path, lambda _: _make_state())
+            except Exception as e:
+                errors.append(e)
+
+        threads = [threading.Thread(target=worker) for _ in range(5)]
+        for t in threads:
+            t.start()
+        for t in threads:
+            t.join()
+
+        assert not errors
+
+
+# -----------------------------------------------------------------------------
+# Clé composite context-aware (Lot D)
+# -----------------------------------------------------------------------------
+
+
+class TestCacheContextAware:
+    """Lot D — Le cache ne doit jamais hit entre deux contextes différents.
+
+    La clé composite combine 6 éléments : phash, window_title, app_name,
+    enable_ocr, enable_ui_detection, workflow_id. Toute variation sur une
+    de ces dimensions doit produire un cache miss, même si le screenshot
+    (donc le phash) est strictement identique.
+    """
+
+    def test_same_image_different_window_miss(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (60, 60, 60))
+
+        _, hit_a, _ = cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            window_title="Chrome",
+            app_name="chrome.exe",
+            workflow_id="wf1",
+        )
+        _, hit_b, _ = cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            window_title="Firefox",  # Diffère
+            app_name="chrome.exe",
+            workflow_id="wf1",
+        )
+        assert hit_a is False
+        assert hit_b is False  # Contexte fenêtre différent → miss
+
+    def test_same_image_different_app_miss(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (90, 90, 90))
+
+        cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            window_title="Doc.pdf",
+            app_name="acrobat.exe",
+        )
+        _, hit, _ = cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            window_title="Doc.pdf",
+            app_name="sumatra.exe",  # Diffère
+        )
+        assert hit is False  # app_name différent → miss
+
+    def test_same_image_different_flags_miss(self, tmp_path):
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (120, 120, 120))
+
+        # Run 1 : OCR actif
+        cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            enable_ocr=True,
+            enable_ui_detection=True,
+        )
+        # Run 2 : OCR désactivé → clé différente
+        _, hit_ocr_off, _ = cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            enable_ocr=False,
+            enable_ui_detection=True,
+        )
+        # Run 3 : UI désactivé → encore une autre clé
+        _, hit_ui_off, _ = cache.get_or_compute(
+            path,
+            lambda _: _make_state(),
+            enable_ocr=True,
+            enable_ui_detection=False,
+        )
+        assert hit_ocr_off is False
+        assert hit_ui_off is False
+
+    def test_same_image_different_workflow_miss(self, tmp_path):
+        """Isolation stricte inter-workflows : replay wf1 ≠ replay wf2."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (33, 77, 200))
+
+        cache.get_or_compute(
+            path, lambda _: _make_state(), workflow_id="wf_alpha"
+        )
+        _, hit, _ = cache.get_or_compute(
+            path, lambda _: _make_state(), workflow_id="wf_beta"
+        )
+        assert hit is False
+
+    def test_same_image_same_context_hit(self, tmp_path):
+        """Tout identique → hit (comportement cache nominal)."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (42, 42, 42))
+
+        kwargs = dict(
+            window_title="Notepad",
+            app_name="notepad.exe",
+            enable_ocr=True,
+            enable_ui_detection=True,
+            workflow_id="wf_stable",
+        )
+        calls = []
+
+        def compute(p):
+            calls.append(p)
+            return _make_state()
+
+        _, hit1, _ = cache.get_or_compute(path, compute, **kwargs)
+        _, hit2, _ = cache.get_or_compute(path, compute, **kwargs)
+        assert hit1 is False
+        assert hit2 is True
+        assert len(calls) == 1
+
+    def test_default_context_is_stable(self, tmp_path):
+        """Rétrocompat : deux callers sans kwargs de contexte partagent
+        la même entrée de cache (ancien comportement préservé)."""
+        cache = ScreenStateCache(ttl_seconds=10.0)
+        path = _make_screenshot(tmp_path, (11, 22, 33))
+
+        calls = []
+
+        def compute(p):
+            calls.append(p)
+            return _make_state()
+
+        # Deux appels sans kwargs → doivent partager la même clé
+        _, hit1, _ = cache.get_or_compute(path, compute)
+        _, hit2, _ = cache.get_or_compute(path, compute)
+        assert hit1 is False
+        assert hit2 is True
+        assert len(calls) == 1
+
+    def test_invalidate_if_changed_ignores_context(self, tmp_path):
+        """invalidate_if_changed regarde le phash seul, pas la clé composite.
+        Un changement visuel majeur purge toutes les entrées, quel que soit
+        leur contexte (workflow, flags, fenêtre)."""
+        import random
+
+        cache = ScreenStateCache(ttl_seconds=10.0)
+
+        # Deux entrées dans des contextes différents MAIS pour la même image.
+        img1 = Image.new("RGB", (320, 240))
+        for y in range(240):
+            for x in range(320):
+                img1.putpixel((x, y), (y, y, y))
+        p1 = tmp_path / "orig.png"
+        img1.save(str(p1))
+
+        cache.get_or_compute(
+            str(p1), lambda _: _make_state(), workflow_id="wf1"
+        )
+        cache.get_or_compute(
+            str(p1), lambda _: _make_state(), workflow_id="wf2"
+        )
+        assert len(cache) == 2
+
+        # Nouveau screenshot radicalement différent → doit tout purger.
+        random.seed(42)
+        img2 = Image.new("RGB", (320, 240))
+        for y in range(240):
+            for x in range(320):
+                v = random.randint(0, 255)
+                img2.putpixel((x, y), (v, v, v))
+        p2 = tmp_path / "noise.png"
+        img2.save(str(p2))
+
+        purged = cache.invalidate_if_changed(str(p2), threshold=0.3)
+        assert purged is True
+        assert len(cache) == 0