Externalize dictionaries and add anonymization review corpus

This commit is contained in:
2026-04-21 10:32:57 +02:00
parent 012445755a
commit 500ebc28c2
99 changed files with 1805 additions and 805 deletions

View File

@@ -5,6 +5,7 @@ import sys
from pathlib import Path
sys.path.insert(0, str(Path(__file__).parent.parent))
from config_defaults import RUNTIME_DICTIONARIES_CONFIG_PATH
from anonymizer_core_refactored_onnx import process_pdf
# Test sur 3 documents du test dataset
@@ -32,7 +33,7 @@ for doc in test_docs:
out_dir=out_dir,
make_vector_redaction=False,
also_make_raster_burn=False,
config_path=Path("config/dictionnaires.yml"),
config_path=RUNTIME_DICTIONARIES_CONFIG_PATH,
use_hf=False,
ner_manager=None,
vlm_manager=None,
@@ -56,4 +57,3 @@ for doc in test_docs:
print(f"{pdf_path.name}: Erreur - {e}")
print("\n✅ Test terminé")