chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,15 @@
{
"source_file": "LETTRE DE SORTIE 23074494.pdf",
"total_replacements": 9,
"regex_replacements": 6,
"ner_replacements": 1,
"sweep_replacements": 2,
"entities_found": [
{
"original": "CLEMENTINE",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9008113741874695
}
]
}

View File

@@ -0,0 +1,591 @@
{
"source_file": "trackare-23008697-23074494_23008697_23074494.pdf",
"total_replacements": 1079,
"regex_replacements": 375,
"ner_replacements": 30,
"sweep_replacements": 674,
"entities_found": [
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23008697",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23074494",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "99999",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "TALHINAS",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "CHIRURGIE ORTHOPEDIQUE\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "ALVES",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "ALVES",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "CLEMENTINE",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "CLEMENTINE",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "2 CHEMIN PE DE NAVARRE Ville de résidence: BAYONNE",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "GUILLEMAUD GUILLEMAUD GUILLEMAUD",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9955514073371887
},
{
"original": "LAGARRIGUE Juliette",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9903583526611328
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9979783296585083
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9983627200126648
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9987360835075378
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9911686182022095
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9982384443283081
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.998572826385498
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9986976385116577
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.998271644115448
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9985122680664062
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9984965324401855
},
{
"original": "Sophie Signé",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9053983688354492
},
{
"original": "LAGARRIGUE Juliette",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9956217408180237
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9939037561416626
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9941812753677368
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9964895248413086
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9988969564437866
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.99896639585495
},
{
"original": "Fabienne ETCHART",
"replacement": "[SOIGNANT_20]",
"source": "ner",
"score": 0.9973636865615845
},
{
"original": "Charlotte GELULE",
"replacement": "[MEDECIN_2]",
"source": "ner",
"score": 0.8290235996246338
},
{
"original": "Sophie VESSIE DE GLACE",
"replacement": "[SOIGNANT_2]",
"source": "ner",
"score": 0.9596654772758484
},
{
"original": "Laure",
"replacement": "[ADRESSE_3]",
"source": "ner",
"score": 0.819611668586731
},
{
"original": "Elise MARTHIENS",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.996931791305542
},
{
"original": "Alexandre BLANCO",
"replacement": "[MEDECIN_13]",
"source": "ner",
"score": 0.9958021640777588
},
{
"original": "Alexandre BLANCO",
"replacement": "[MEDECIN_13]",
"source": "ner",
"score": 0.9967115521430969
},
{
"original": "SERINGUE",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9452900886535645
},
{
"original": "Christian SERINGUE",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9071865677833557
},
{
"original": "Yvan HUGUES",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9980290532112122
},
{
"original": "Elise MARTHIENS",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9816389083862305
}
]
}