chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,21 @@
{
"source_file": "CONSULTATION ANESTHESISTE 23042633.pdf",
"total_replacements": 17,
"regex_replacements": 16,
"ner_replacements": 0,
"sweep_replacements": 1,
"entities_found": [
{
"original": "N° Tél :",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "N° Tél :",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
}
]
}

View File

@@ -0,0 +1,327 @@
{
"source_file": "trackare-BA143366-23042633_BA143366_23042633.pdf",
"total_replacements": 770,
"regex_replacements": 254,
"ner_replacements": 30,
"sweep_replacements": 486,
"entities_found": [
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23042633",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "NANTES",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "CHIRURGIE VISCERALE - CHIRURGIE VASCULAIRE THORACIQ\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "7 AVENUE LAMOTHE Ville de résidence: BAYONNE",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "THORACIQ",
"replacement": "[PATIENT_2]",
"source": "ner",
"score": 0.8464211821556091
},
{
"original": "CUGNIN Nina",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.9005873203277588
},
{
"original": "THORACIQ",
"replacement": "[PATIENT_2]",
"source": "ner",
"score": 0.8541287779808044
},
{
"original": "CUGNIN Nina S",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.9582687616348267
},
{
"original": "CUGNIN Nina",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.8894662261009216
},
{
"original": "THORACIQ",
"replacement": "[PATIENT_2]",
"source": "ner",
"score": 0.836461067199707
},
{
"original": "LANSOPRAZOLE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8621206879615784
},
{
"original": "INEGY",
"replacement": "[MEDECIN_11]",
"source": "ner",
"score": 0.8603823184967041
},
{
"original": "CUGNIN Nina S",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.9516347050666809
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9910129904747009
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.8953914642333984
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.8304948806762695
},
{
"original": "Alessandro ORALE",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9939954876899719
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9872381687164307
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.96142578125
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9597396850585938
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9578719139099121
},
{
"original": "FALCHETTI",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9666749835014343
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9830695986747742
},
{
"original": "Alessandro",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.9873125553131104
},
{
"original": "Alessandro COMP",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.8112282752990723
},
{
"original": "Alessandro Presc.",
"replacement": "[MEDECIN_1]",
"source": "ner",
"score": 0.908183753490448
},
{
"original": "Marion PUJOS",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9935529232025146
},
{
"original": "Marion PUJOS",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9974419474601746
},
{
"original": "Marion PUJOS",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9967696070671082
},
{
"original": "Marion PUJOS",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9974474310874939
},
{
"original": "Nolwenn BARRE",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9972164630889893
},
{
"original": "Nolwenn BARRE",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.996601402759552
},
{
"original": "Tricard Isabelle",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9660103917121887
},
{
"original": "Pannecau",
"replacement": "[ADRESSE_2]",
"source": "ner",
"score": 0.8852323293685913
}
]
}