chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,993 @@
{
"source_file": "trackare-09013298-23103327_09013298_23103327.pdf",
"total_replacements": 759,
"regex_replacements": 321,
"ner_replacements": 99,
"sweep_replacements": 339,
"entities_found": [
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "09013298",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23103327",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "99999",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "BAYONNE",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "CHIRURGIE VISCERALE - CHIRURGIE VISCERALE\nDossier Patient\nDétails des patients",
"replacement": "[MEDECIN_10]",
"source": "regex",
"category": "patient"
},
{
"original": "RUIZ",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "RUIZ",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "BERNARD",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "BERNARD",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "VILLA MENDI LOREA 19 BIS RUE DELBARRE Ville de résidence: CAMBO LES BAINS",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9878856539726257
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9986512660980225
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9983162879943848
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9971495866775513
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9988296627998352
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9988391995429993
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9914494752883911
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9989226460456848
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9989750385284424
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9978576302528381
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.998502790927887
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9984354972839355
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9982832670211792
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9988005757331848
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9988463521003723
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9989578127861023
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9932489395141602
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.989704430103302
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9898573756217957
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9856095314025879
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9939169883728027
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9815130233764648
},
{
"original": "PONTIER Bénédicte S",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.976274847984314
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9321318864822388
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9340947270393372
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9429000616073608
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.9897972345352173
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.8429403305053711
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.8999811410903931
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9958069920539856
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9987487196922302
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9981417059898376
},
{
"original": "Anne Marie ETCHELECU",
"replacement": "[MEDECIN_16]",
"source": "ner",
"score": 0.9975035786628723
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9951545596122742
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9927604794502258
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9974291920661926
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9988921284675598
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9987555742263794
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9984744787216187
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9987881779670715
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9980058670043945
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9980677962303162
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9991288781166077
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9988998174667358
},
{
"original": "Mayalen FOURCADE",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9991307854652405
},
{
"original": "Jean Alexis BARREAU",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9962884783744812
},
{
"original": "Mayalen",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9620521068572998
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9686844348907471
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.989704430103302
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9898573756217957
},
{
"original": "PONTIER Bénédicte",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9765855669975281
},
{
"original": "PONTIER Bénédicte Signé",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9693724513053894
},
{
"original": "LARROUY Pascale",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9719232320785522
},
{
"original": "Paul Jean Signé",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9852433204650879
},
{
"original": "Paul Jean 100MG",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8550976514816284
},
{
"original": "Paul Jean Réalisé",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9636087417602539
},
{
"original": "Paul Jean SO",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8122854232788086
},
{
"original": "Paul Jean Signé",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.897781252861023
},
{
"original": "Paul Jean Signé",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9383000135421753
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9672494530677795
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9716664552688599
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9636292457580566
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9744236469268799
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9568382501602173
},
{
"original": "Paul Jean Signé",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9508012533187866
},
{
"original": "Paul Jean S",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8876628875732422
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9540448188781738
},
{
"original": "MATERNOWSKI CUTANEE",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9509925246238708
},
{
"original": "Paul Jean SOUS- S",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8352255821228027
},
{
"original": "Joelle URINAL",
"replacement": "[SOIGNANT_10]",
"source": "ner",
"score": 0.968960165977478
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9335473775863647
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9519494771957397
},
{
"original": "Jean Alexis SOMMEIL",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8088513016700745
},
{
"original": "Joelle SOMMEIL",
"replacement": "[SOIGNANT_10]",
"source": "ner",
"score": 0.8512681126594543
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9909836053848267
},
{
"original": "Mayalen",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9931325912475586
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9865325689315796
},
{
"original": "Mayalen",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9972677230834961
},
{
"original": "Jean Alexis",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8845009803771973
},
{
"original": "Mayalen",
"replacement": "[SOIGNANT_3]",
"source": "ner",
"score": 0.9975844621658325
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9782352447509766
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9955620765686035
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9931632876396179
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9990509748458862
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9988960027694702
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9989871978759766
},
{
"original": "Paul Jean MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9989790320396423
},
{
"original": "Marion PUJOS",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9786112308502197
},
{
"original": "Gautier HERVIEUX",
"replacement": "[MEDECIN_13]",
"source": "ner",
"score": 0.9973151087760925
},
{
"original": "Gautier FLESTOUCH",
"replacement": "[MEDECIN_13]",
"source": "ner",
"score": 0.9983919858932495
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9127732515335083
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8871574401855469
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9310002326965332
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.8880269527435303
},
{
"original": "Paul Jean",
"replacement": "[SOIGNANT_11]",
"source": "ner",
"score": 0.9261118769645691
},
{
"original": "MATERNOWSKI",
"replacement": "[SOIGNANT_7]",
"source": "ner",
"score": 0.9485020637512207
},
{
"original": "BACHOFFER",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8403929471969604
},
{
"original": "Tomas AINCIART",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9842341542243958
},
{
"original": "Kattina ARTOLA",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.909594714641571
}
]
}