chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,63 @@
{
"source_file": "BACTERIO 23069373.pdf",
"total_replacements": 22,
"regex_replacements": 20,
"ner_replacements": 1,
"sweep_replacements": 1,
"entities_found": [
{
"original": "98214460",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "LOPES Cristina",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "LOPES CHIRURGIE VASCULAIRE THORACIQ",
"replacement": "[PATIENT_1]",
"source": "regex",
"category": "patient"
},
{
"original": "07/09/1980",
"replacement": "[DATE_NAISS_1]",
"source": "regex",
"category": "date_naissance"
},
{
"original": "BRIAULT Isabelle\nReçu le",
"replacement": "[SOIGNANT_1]",
"source": "regex",
"category": "soignant"
},
{
"original": "RIVERA Caroline\nPrélevé le",
"replacement": "[SOIGNANT_2]",
"source": "regex",
"category": "soignant"
},
{
"original": "2300137359",
"replacement": "[IDENTIFIANT_1]",
"source": "regex",
"category": "identifiant"
},
{
"original": "23069373",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "Jacques Loëb",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9895591139793396
}
]
}

View File

@@ -0,0 +1,51 @@
{
"source_file": "CONSULTATION ANESTHESISTE 23069373.pdf",
"total_replacements": 16,
"regex_replacements": 12,
"ner_replacements": 3,
"sweep_replacements": 1,
"entities_found": [
{
"original": "23616410",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23616410",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "N° Tél :",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "N° Tél :",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "THERALENE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8045068383216858
},
{
"original": "LOPES Cristina",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9866553544998169
},
{
"original": "LOPES Cristina",
"replacement": "[PATIENT_1]",
"source": "ner",
"score": 0.9929898977279663
}
]
}

View File

@@ -0,0 +1,21 @@
{
"source_file": "CRO 23069373.pdf",
"total_replacements": 11,
"regex_replacements": 7,
"ner_replacements": 2,
"sweep_replacements": 2,
"entities_found": [
{
"original": "Bochra ZAYENE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9982967376708984
},
{
"original": "Jérémy HENRIOT",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9980157017707825
}
]
}