chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,15 @@
{
"source_file": "CRO 23036651.pdf",
"total_replacements": 16,
"regex_replacements": 11,
"ner_replacements": 1,
"sweep_replacements": 4,
"entities_found": [
{
"original": "Ma LAJUS",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9599738717079163
}
]
}

View File

@@ -0,0 +1,813 @@
{
"source_file": "trackare-23002933-23036651_23002933_23036651.pdf",
"total_replacements": 901,
"regex_replacements": 439,
"ner_replacements": 61,
"sweep_replacements": 401,
"entities_found": [
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23002933",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23036651",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "281124008801353",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "40088",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "DAX",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "LAGUERRE Daniel",
"replacement": "[MEDECIN_1]",
"source": "regex",
"category": "patient"
},
{
"original": "NEURO CHIRURGIE - NEURO-CHIRURGIE\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "LAJUS",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "LAJUS",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "ELODIE",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "ELODIE",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "56 IMPASSE HALIHA Ville de résidence: PEYREHORADE",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "GUILLEMAUD",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9968613982200623
},
{
"original": "MARCHAL Claire Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9087808728218079
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9953942894935608
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.993009090423584
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9981397390365601
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9973645806312561
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.997568666934967
},
{
"original": "PONTIER Bénédicte S",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9530795812606812
},
{
"original": "MARCHAL Claire S",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9131227731704712
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9982884526252747
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9962233304977417
},
{
"original": "SOL LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.8998889923095703
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.8566805124282837
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9965806007385254
},
{
"original": "HYDROCORTISONE ROUSS 10MG PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9946969151496887
},
{
"original": "HYDROCORTISONE ROUSS 10MG PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9885594844818115
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9526235461235046
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9894489645957947
},
{
"original": "PONTIER Bénédicte Glyc",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.8898442387580872
},
{
"original": "MARCHAL Claire",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9725657105445862
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9972636699676514
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9967857599258423
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9958333969116211
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9927635788917542
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9589743614196777
},
{
"original": "MARCHAL Claire S",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.8102717399597168
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9977118372917175
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.998565673828125
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9990689158439636
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9990503191947937
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9974215626716614
},
{
"original": "PONTIER Bénédicte S",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9291247725486755
},
{
"original": "LANSOPRAZOLE BGA",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9504513740539551
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9265763163566589
},
{
"original": "HYDROCORTISONE ROUSS",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.976944625377655
},
{
"original": "MG PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9928484559059143
},
{
"original": "HYDROCORTISONE ROUSS",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.998754620552063
},
{
"original": "MG PONTIER Bénédicte C",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9003084897994995
},
{
"original": "HYDROCORTISONE ROUSS",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.998772382736206
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9889269471168518
},
{
"original": "Mylène",
"replacement": "[MEDECIN_14]",
"source": "ner",
"score": 0.8728764653205872
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.8759884834289551
},
{
"original": "Joelle",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.8931033611297607
},
{
"original": "Joelle",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.8416308164596558
},
{
"original": "Joelle",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.8764015436172485
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.9541465640068054
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_15]",
"source": "ner",
"score": 0.864726185798645
},
{
"original": "Joelle Réalisé",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.8551164269447327
},
{
"original": "Emeline SONDE VESICALE",
"replacement": "[MEDECIN_15]",
"source": "ner",
"score": 0.8660532832145691
},
{
"original": "Bénédicte",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.8739981055259705
},
{
"original": "Claire Arrêté",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.8546556234359741
},
{
"original": "Joelle PO",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.9329983592033386
},
{
"original": "Claire Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9795284271240234
},
{
"original": "Claire Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9943854808807373
},
{
"original": "Claire Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.995259702205658
},
{
"original": "Claire Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9836132526397705
},
{
"original": "ALIMENTATION",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9854951500892639
},
{
"original": "Bénédicte DE L",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9647437930107117
},
{
"original": "Joelle Signé",
"replacement": "[SOIGNANT_14]",
"source": "ner",
"score": 0.979009747505188
},
{
"original": "Dr DL",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.82045978307724
},
{
"original": "Marie Mère",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9022787809371948
}
]
}