Externalize dictionaries and add anonymization review corpus

This commit is contained in:
2026-04-21 10:32:57 +02:00
parent 012445755a
commit 500ebc28c2
99 changed files with 1805 additions and 805 deletions

View File

@@ -9,6 +9,7 @@ import time
sys.path.insert(0, str(Path(__file__).parent.parent))
import anonymizer_core_refactored_onnx as core
+from config_defaults import RUNTIME_DICTIONARIES_CONFIG_PATH
# Dossier de test
test_dir = Path("/tmp/test_gui_pdfs")
@@ -39,7 +40,7 @@ for i, pdf in enumerate(pdfs, start=1):
out_dir=out_dir,
make_vector_redaction=False,
also_make_raster_burn=True,
-config_path=Path("config/dictionnaires.yml"),
+config_path=RUNTIME_DICTIONARIES_CONFIG_PATH,
use_hf=False,
ner_manager=None,
ner_thresholds=None,