chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,39 @@
{
"source_file": "CRH 23096917.pdf",
"total_replacements": 144,
"regex_replacements": 130,
"ner_replacements": 4,
"sweep_replacements": 10,
"entities_found": [
{
"original": "10100829638",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "K. GLADELP",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9972771406173706
},
{
"original": "Douglas",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8528928756713867
},
{
"original": "MEURINNE",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9955618381500244
},
{
"original": "BONNEAU PEREZ Chiara",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9924678206443787
}
]
}

View File

@@ -0,0 +1,51 @@
{
"source_file": "CRO 23096917.pdf",
"total_replacements": 15,
"regex_replacements": 5,
"ner_replacements": 7,
"sweep_replacements": 3,
"entities_found": [
{
"original": "Douglas",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8938594460487366
},
{
"original": "BONNEAU PEREZ",
"replacement": "[ADRESSE_1]",
"source": "ner",
"score": 0.8956999778747559
},
{
"original": "Meckel",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9558639526367188
},
{
"original": "CHIARA BONNEAU PEREZ",
"replacement": "[ADRESSE_1]",
"source": "ner",
"score": 0.9720442295074463
},
{
"original": "Laurence",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9299138784408569
},
{
"original": "ANDRIANAVALOMIONONA",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9833140969276428
},
{
"original": "BONNEAU PEREZ",
"replacement": "[ADRESSE_1]",
"source": "ner",
"score": 0.9940961599349976
}
]
}

View File

@@ -0,0 +1,447 @@
{
"source_file": "trackare-23011581-23096917_23011581_23096917.pdf",
"total_replacements": 442,
"regex_replacements": 236,
"ner_replacements": 22,
"sweep_replacements": 184,
"entities_found": [
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23011581",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23096917",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "99999",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "TOULOUSE",
"replacement": "[ADRESSE_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "BONNEAU PEREZ",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "MEDECINE PEDIATRIE - PEDIATRIE CHIRURGIE\nDossier Patient\nDétails des patients",
"replacement": "[MEDECIN_8]",
"source": "regex",
"category": "patient"
},
{
"original": "BONNEAU PEREZ",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "CHIARA",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "CHIARA",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "49 RUE DES CHALLETS Ville de résidence: TOULOUSE",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "CHIARA BONNEAU PEREZ",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.995280385017395
},
{
"original": "MIMIAGUE Caroline",
"replacement": "[MEDECIN_14]",
"source": "ner",
"score": 0.9757054448127747
},
{
"original": "Elise Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9855073690414429
},
{
"original": "Elise Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9982585310935974
},
{
"original": "Elise Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9403896927833557
},
{
"original": "PICAMILH Marie- Signé",
"replacement": "[SOIGNANT_10]",
"source": "ner",
"score": 0.8749032020568848
},
{
"original": "PLAIE-COLLE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8283377885818481
},
{
"original": "MIMIAGUE Caroline",
"replacement": "[MEDECIN_14]",
"source": "ner",
"score": 0.9641996622085571
},
{
"original": "SALLES Olivia",
"replacement": "[SOIGNANT_8]",
"source": "ner",
"score": 0.8048039078712463
},
{
"original": "Elise Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9988268613815308
},
{
"original": "Elise Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9987068176269531
},
{
"original": "Elise",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9093412160873413
},
{
"original": "PICAMILH Marie- S",
"replacement": "[SOIGNANT_10]",
"source": "ner",
"score": 0.8275143504142761
},
{
"original": "Caroline PLAIE-COLLE",
"replacement": "[MEDECIN_14]",
"source": "ner",
"score": 0.997880756855011
},
{
"original": "Jonathan KT COURT",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9976471066474915
},
{
"original": "Jonathan DOULEUR",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9927663207054138
},
{
"original": "Christelle REPAS",
"replacement": "[SOIGNANT_9]",
"source": "ner",
"score": 0.9929307103157043
},
{
"original": "Jonathan KT COURT",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9532928466796875
},
{
"original": "Emeline GUADAGNIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9989246726036072
},
{
"original": "Jonathan OURIOU",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9811881184577942
},
{
"original": "Douglas",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.8267942070960999
},
{
"original": "Valentine LAPEGUE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9638671875
}
]
}