chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,801 @@
{
"source_file": "trackare-17008605-23103061_17008605_23103061.pdf",
"total_replacements": 1030,
"regex_replacements": 334,
"ner_replacements": 73,
"sweep_replacements": 623,
"entities_found": [
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "17008605",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103061",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "99999",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "TARRASA",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "CHIRURGIE VISCERALE - CHIRURGIE VASCULAIRE THORACIQ\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_3]",
"source": "regex",
"category": "patient"
},
{
"original": "ADO",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "FONT",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "TERESA",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "TERESA",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "41 BD VICTOR HUGO Ville de résidence: ST JEAN DE LUZ",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "Iñaki",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9937097430229187
},
{
"original": "Iñaki",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9641836285591125
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9990790486335754
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9989944100379944
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9985485076904297
},
{
"original": "Jules Glyc",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9932764768600464
},
{
"original": "Maialen LANDART S",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9553439021110535
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9990410804748535
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9985001087188721
},
{
"original": "BASSIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8932346701622009
},
{
"original": "URINAL",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9220082759857178
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9984788298606873
},
{
"original": "BASSIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8112723231315613
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9980289340019226
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9969644546508789
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9985788464546204
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9986777901649475
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9986012578010559
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9985046982765198
},
{
"original": "THORACIQ",
"replacement": "[PATIENT_3]",
"source": "ner",
"score": 0.8055377006530762
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9930952191352844
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9969999194145203
},
{
"original": "ETCHEVERRY Marie- France",
"replacement": "[CONTACT_1]",
"source": "ner",
"score": 0.9960440993309021
},
{
"original": "Jules",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9339829683303833
},
{
"original": "Jules 50MG",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.8070316910743713
},
{
"original": "Jules",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9178861379623413
},
{
"original": "Jules Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9560039639472961
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9987697005271912
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9972798824310303
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.998546302318573
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9987225532531738
},
{
"original": "Maialen LANDART Signé — PLAIE-COLLE",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9561615586280823
},
{
"original": "Maialen LANDART",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9988967776298523
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9978019595146179
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.997433602809906
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9978696703910828
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9975042343139648
},
{
"original": "VIDER",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.8400055170059204
},
{
"original": "BASSIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9462058544158936
},
{
"original": "URINAL",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9445217251777649
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9980554580688477
},
{
"original": "BASSIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8443941473960876
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9979345798492432
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.994988203048706
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9984185695648193
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.997113049030304
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9958553910255432
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9932015538215637
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9983125329017639
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9986751675605774
},
{
"original": "Celine MOUESCA",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9982669353485107
},
{
"original": "ETCHEVERRY Marie- France",
"replacement": "[CONTACT_1]",
"source": "ner",
"score": 0.9849587082862854
},
{
"original": "Jules 50MG",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9188075661659241
},
{
"original": "Jules 50MG",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.91617351770401
},
{
"original": "Jules Signé",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.9292829036712646
},
{
"original": "Quentin Signé",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.973935604095459
},
{
"original": "CHANGES",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.9228538870811462
},
{
"original": "Pascal CHANGE",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.8763381838798523
},
{
"original": "Marie-",
"replacement": "[SOIGNANT_17]",
"source": "ner",
"score": 0.9375699162483215
},
{
"original": "Maialen",
"replacement": "[SOIGNANT_5]",
"source": "ner",
"score": 0.9670560359954834
},
{
"original": "Celine CHANGES",
"replacement": "[SOIGNANT_19]",
"source": "ner",
"score": 0.9880847930908203
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9986432194709778
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9987802505493164
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9989305734634399
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9989043474197388
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9987698793411255
},
{
"original": "Quentin COATSALIOU",
"replacement": "[SOIGNANT_18]",
"source": "ner",
"score": 0.9987133741378784
},
{
"original": "Mélanie MALLET",
"replacement": "[SOIGNANT_9]",
"source": "ner",
"score": 0.9978445172309875
},
{
"original": "Mélanie MALLET",
"replacement": "[SOIGNANT_9]",
"source": "ner",
"score": 0.9895050525665283
},
{
"original": "Fatiha CHABANE",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9985709190368652
},
{
"original": "larrouy",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9881342053413391
},
{
"original": "larrouy",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9830160737037659
},
{
"original": "larrouy",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9809269905090332
}
]
}