chore: mise à jour output pipeline (anonymized + structured)

Résultats de re-traitement pipeline v2 sur 261 dossiers.

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
This commit is contained in:
dom
2026-03-07 23:14:42 +01:00
parent c73515ac89
commit 13fe9fa666
734 changed files with 157158 additions and 304963 deletions

View File

@@ -0,0 +1,255 @@
{
"source_file": "trackare-05017783-23056475_05017783_23056475.pdf",
"total_replacements": 215,
"regex_replacements": 122,
"ner_replacements": 13,
"sweep_replacements": 80,
"entities_found": [
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "05017783",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23056475",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "MONTBELIARD",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "ONCOLOGIE - ONCOLOGIE HC\nDossier Patient\nDétails des patients",
"replacement": "[PATIENT_2]",
"source": "regex",
"category": "patient"
},
{
"original": "21 IMPASSE DES CHENES Ville de résidence: ST MARTIN DE HINX",
"replacement": "[ADRESSE_1]",
"source": "regex",
"category": "adresse"
},
{
"original": "DEROURE BURTIN",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9931824207305908
},
{
"original": "CURUTCHET",
"replacement": "[MEDECIN_8]",
"source": "ner",
"score": 0.8650376200675964
},
{
"original": "Emma ORALE",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9099580645561218
},
{
"original": "Emma ORALE",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.8146445751190186
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9966465830802917
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9965463280677795
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9955844879150391
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9956602454185486
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.940226137638092
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.8860046863555908
},
{
"original": "Troisier",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8182731866836548
},
{
"original": "Emma CLOT",
"replacement": "[SOIGNANT_6]",
"source": "ner",
"score": 0.9464282989501953
},
{
"original": "Jean Monnet",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9905607104301453
}
]
}