chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,609 @@
{
"source_file": "trackare-00270032-23107113_00270032_23107113.pdf",
"total_replacements": 548,
"regex_replacements": 218,
"ner_replacements": 54,
"sweep_replacements": 276,
"entities_found": [
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "00270032",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23107113",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "BAYONNE",
"replacement": "[ADRESSE_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "POLE MEDECINE INTERNE - MALADIES INFECTIEUSES\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "29 RUE BOURGNEUF Ville de résidence: BAYONNE",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "GUILLEMAUD",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9894199371337891
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9962841272354126
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9975832104682922
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9963946342468262
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9985029101371765
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9906206727027893
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9963920712471008
},
{
"original": "SAINT RAYMOND Julie",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9731234908103943
},
{
"original": "Patricia URRUTIA- IRIBARREN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.8861247897148132
},
{
"original": "VALACICLOVIR",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8245244026184082
},
{
"original": "VALACICLOVIR",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8873762488365173
},
{
"original": "Julie GELULE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.971260666847229
},
{
"original": "Julie GELULE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9412921071052551
},
{
"original": "Julie",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.886431872844696
},
{
"original": "Julie",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9413624405860901
},
{
"original": "Julie Signé",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9689236283302307
},
{
"original": "Julie S",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9562257528305054
},
{
"original": "VAREIL Marc-Olivier",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9899236559867859
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9989156126976013
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.998801589012146
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.998906135559082
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9988324046134949
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9988493323326111
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9988656044006348
},
{
"original": "Patricia URRUTIA- IRIBARREN(DOUSSEN)",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9712371826171875
},
{
"original": "Patricia URRUTIA",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9933282732963562
},
{
"original": "VALACICLOVIR",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9641461372375488
},
{
"original": "VALACICLOVIR",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9745568633079529
},
{
"original": "Julie GELULE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9705016613006592
},
{
"original": "Julie GELULE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9392681121826172
},
{
"original": "Julie",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.8734278678894043
},
{
"original": "Julie",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9403896927833557
},
{
"original": "Julie Signé",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9686329960823059
},
{
"original": "Julie Signé",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9974875450134277
},
{
"original": "Julie Signé",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9960145354270935
},
{
"original": "VAREIL Marc-Olivier",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9829892516136169
},
{
"original": "Julie SAINT RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9977169036865234
},
{
"original": "Julie SAINT RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9971593022346497
},
{
"original": "Julie SAINT RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.998344898223877
},
{
"original": "Julie SAINT RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9983274936676025
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9805227518081665
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9861031770706177
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9898198246955872
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.991865336894989
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9906991124153137
},
{
"original": "Arnaud",
"replacement": "[MEDECIN_8]",
"source": "ner",
"score": 0.8650139570236206
},
{
"original": "Sarhane",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9806550145149231
},
{
"original": "Mirentchu",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.9945974946022034
},
{
"original": "Patricia URRUTIA",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.987453818321228
},
{
"original": "Julie SAINT-RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9900612831115723
},
{
"original": "Julie SAINT",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.8602615594863892
},
{
"original": "Julie SAINT-RAYMOND",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9939961433410645
},
{
"original": "Père Sarhane Redouan",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9704276323318481
},
{
"original": "Mère Quinou Sylvie",
"replacement": "[CONTACT_1]",
"source": "ner",
"score": 0.9751859903335571
}
]
}