G3-A câblage moteur réel (engine_bridge.py) : EngineSettings + NerManagers à chargement paresseux (aucun manager à l'import), kwargs alignés CLI/V5 (make_vector_redaction=False, also_make_raster_burn=True, config_path, use_hf, ner/gliner/camembert_manager, ogc_label) ; make_process_fn engine injectable ; état managers not_loaded/loading/ready/unavailable, échecs optionnels tolérés. G3-B Configuration (config_state.py + tabs/tab_config.py) : ConfigState → EngineSettings, profils via profile_defaults (path injectable), options raster/NER local/profil/sortie, état managers, sections admin-only via admin_mode. G3-C Licence UI (machine_id.py + tab_about) : activation par clef (LicenseClient.activate), bouton vérifier (check), affichage statut, aucun token loggé, aucun appel réseau au démarrage (local_status seul). Intégration : tab_usage exécute via le moteur réel selon ConfigState (make_process_fn), anti double-lancement UI. app.py câble Config↔Usage↔licence. G3-D build-prep : anonymisation_gui_v6_onefile.spec (entry V6, customtkinter + modules gui_v6 en hiddenimports). Installateur Anonymisation.iss produit déjà la cible Anonymisation-Setup.exe. Aucun artefact .exe commité ; build Windows à part. Tests +14 (engine_bridge 8, config_state 6). self-test exit 0, 46 tests gui_v6, 193 tests/unit (0 régression). Moteur/V5/specs CLI intacts. Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
185 lines
5.8 KiB
Python
185 lines
5.8 KiB
Python
"""Pont GUI V6 → moteur d'anonymisation (G3-A).
|
|
|
|
Construit les kwargs d'appel du moteur (``process_document``) au plus proche de
|
|
la V5 / du CLI de production, et charge les managers NER **paresseusement** :
|
|
|
|
- aucun manager n'est importé ni instancié à l'import de ce module ;
|
|
- le chargement réel n'a lieu qu'au premier traitement (``ensure_loaded``) ;
|
|
- les factories sont injectables pour les tests (aucun modèle, aucun réseau).
|
|
|
|
Mapping moteur (identique au CLI validé `scripts/anonymize_cli.py`) :
|
|
- ``camembert_manager`` ← CamembertNerManager (NER local principal)
|
|
- ``ner_manager`` ← EdsPseudoManager (optionnel)
|
|
- ``gliner_manager`` ← GlinerManager (optionnel)
|
|
- ``use_hf`` ← True si au moins un manager NER est chargé
|
|
|
|
Aucune logique de détection ici : on orchestre uniquement.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
from dataclasses import dataclass
|
|
from enum import Enum
|
|
from pathlib import Path
|
|
from typing import Any, Callable, Optional
|
|
|
|
ProcessFn = Callable[[Path, Path], dict]
|
|
ManagerFactory = Callable[[], Any]
|
|
|
|
|
|
class ManagerState(str, Enum):
|
|
NOT_LOADED = "not_loaded"
|
|
LOADING = "loading"
|
|
READY = "ready"
|
|
UNAVAILABLE = "unavailable"
|
|
|
|
|
|
@dataclass
|
|
class EngineSettings:
|
|
"""Réglages d'appel moteur exposés par l'onglet Configuration."""
|
|
|
|
make_vector_redaction: bool = False
|
|
also_make_raster_burn: bool = True
|
|
config_path: Optional[Path] = None
|
|
use_local_ner: bool = True
|
|
enable_eds: bool = False
|
|
enable_gliner: bool = False
|
|
ogc_label: Optional[str] = None
|
|
profile: Optional[str] = None
|
|
|
|
|
|
def _default_factories() -> dict[str, ManagerFactory]:
|
|
"""Factories par défaut : import paresseux, instanciation + load réels.
|
|
|
|
Définies dans une fonction pour qu'aucun manager ne soit importé à l'import
|
|
de ce module.
|
|
"""
|
|
|
|
def camembert() -> Any:
|
|
from camembert_ner_manager import CamembertNerManager
|
|
|
|
manager = CamembertNerManager()
|
|
manager.load()
|
|
return manager
|
|
|
|
def eds() -> Any:
|
|
from eds_pseudo_manager import EdsPseudoManager
|
|
|
|
manager = EdsPseudoManager()
|
|
manager.load()
|
|
return manager
|
|
|
|
def gliner() -> Any:
|
|
from gliner_manager import GlinerManager
|
|
|
|
manager = GlinerManager()
|
|
manager.load()
|
|
return manager
|
|
|
|
return {"camembert": camembert, "eds": eds, "gliner": gliner}
|
|
|
|
|
|
class NerManagers:
|
|
"""Conteneur de managers NER à chargement paresseux."""
|
|
|
|
def __init__(
|
|
self,
|
|
settings: EngineSettings,
|
|
factories: Optional[dict[str, ManagerFactory]] = None,
|
|
) -> None:
|
|
self._settings = settings
|
|
self._factories = factories if factories is not None else _default_factories()
|
|
self._camembert: Any = None
|
|
self._eds: Any = None
|
|
self._gliner: Any = None
|
|
self._state = ManagerState.NOT_LOADED
|
|
|
|
@property
|
|
def state(self) -> ManagerState:
|
|
return self._state
|
|
|
|
@property
|
|
def use_hf(self) -> bool:
|
|
return bool(self._camembert or self._eds or self._gliner)
|
|
|
|
def as_kwargs(self) -> dict:
|
|
return {
|
|
"ner_manager": self._eds,
|
|
"gliner_manager": self._gliner,
|
|
"camembert_manager": self._camembert,
|
|
}
|
|
|
|
def ensure_loaded(self) -> ManagerState:
|
|
"""Charge les managers requis si nécessaire. Idempotent, sans crash."""
|
|
if not self._settings.use_local_ner:
|
|
self._state = ManagerState.NOT_LOADED
|
|
return self._state
|
|
if self._state == ManagerState.READY:
|
|
return self._state
|
|
|
|
self._state = ManagerState.LOADING
|
|
try:
|
|
# CamemBERT-bio est le NER local principal (obligatoire si NER actif).
|
|
self._camembert = self._factories["camembert"]()
|
|
except Exception:
|
|
self._state = ManagerState.UNAVAILABLE
|
|
return self._state
|
|
|
|
if self._settings.enable_eds:
|
|
try:
|
|
self._eds = self._factories["eds"]()
|
|
except Exception:
|
|
self._eds = None # optionnel : absence tolérée
|
|
if self._settings.enable_gliner:
|
|
try:
|
|
self._gliner = self._factories["gliner"]()
|
|
except Exception:
|
|
self._gliner = None # optionnel : absence tolérée
|
|
|
|
self._state = ManagerState.READY
|
|
return self._state
|
|
|
|
|
|
def build_engine_kwargs(
|
|
settings: EngineSettings, managers: Optional[NerManagers] = None
|
|
) -> dict:
|
|
"""Construit le dict de kwargs passé au moteur."""
|
|
kwargs: dict = {
|
|
"make_vector_redaction": settings.make_vector_redaction,
|
|
"also_make_raster_burn": settings.also_make_raster_burn,
|
|
"config_path": settings.config_path,
|
|
"ogc_label": settings.ogc_label,
|
|
}
|
|
if managers is not None and settings.use_local_ner:
|
|
kwargs.update(managers.as_kwargs())
|
|
kwargs["use_hf"] = managers.use_hf
|
|
else:
|
|
kwargs["use_hf"] = False
|
|
return kwargs
|
|
|
|
|
|
def make_process_fn(
|
|
settings: EngineSettings,
|
|
managers: Optional[NerManagers] = None,
|
|
engine: Optional[Callable[..., dict]] = None,
|
|
) -> ProcessFn:
|
|
"""Retourne un ``process_fn(doc, out_dir)`` câblé au moteur.
|
|
|
|
``engine`` est injectable pour les tests ; par défaut, import paresseux de
|
|
``process_document`` (aucun chargement du moteur à l'import de ce module).
|
|
"""
|
|
managers = managers if managers is not None else NerManagers(settings)
|
|
|
|
def process_fn(doc_path: Path, out_dir: Path) -> dict:
|
|
if settings.use_local_ner:
|
|
managers.ensure_loaded()
|
|
kwargs = build_engine_kwargs(settings, managers)
|
|
run = engine
|
|
if run is None:
|
|
from anonymizer_core_refactored_onnx import process_document
|
|
|
|
run = process_document
|
|
return run(doc_path, out_dir, **kwargs)
|
|
|
|
return process_fn
|