531 lines
12 KiB
JSON
531 lines
12 KiB
JSON
{
|
|
"source_file": "CRH 23100690.pdf",
|
|
"total_replacements": 507,
|
|
"regex_replacements": 215,
|
|
"ner_replacements": 12,
|
|
"sweep_replacements": 280,
|
|
"entities_found": [
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23100690",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100532760",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002111572",
|
|
"replacement": "[CODE_BARRE_1]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "10002111572",
|
|
"replacement": "[CODE_BARRE_1]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "10002111572",
|
|
"replacement": "[CODE_BARRE_1]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fprevost@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "boui@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "dnivet@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "tkhuong-huu@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "aguilngar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "fgoutorbe@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mcboudier@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mbrugel@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mboube@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "faudemar@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_10]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "CHARLES DE GAULLE",
|
|
"replacement": "[PERSONNE_1]",
|
|
"source": "ner",
|
|
"score": 0.9860936999320984
|
|
},
|
|
{
|
|
"original": "Grellety",
|
|
"replacement": "[ADRESSE_2]",
|
|
"source": "ner",
|
|
"score": 0.9852388501167297
|
|
},
|
|
{
|
|
"original": "J. LOEB",
|
|
"replacement": "[PERSONNE_2]",
|
|
"source": "ner",
|
|
"score": 0.9179608821868896
|
|
},
|
|
{
|
|
"original": "PATIENT",
|
|
"replacement": "[MEDECIN]",
|
|
"source": "ner",
|
|
"score": 0.8181775212287903
|
|
},
|
|
{
|
|
"original": "MARTIN Lilian",
|
|
"replacement": "[PATIENT_1]",
|
|
"source": "ner",
|
|
"score": 0.9855286478996277
|
|
},
|
|
{
|
|
"original": "Thomas Grellety",
|
|
"replacement": "[MEDECIN_1]",
|
|
"source": "ner",
|
|
"score": 0.9983272552490234
|
|
},
|
|
{
|
|
"original": "[MEDECIN",
|
|
"replacement": "[PERSONNE_3]",
|
|
"source": "ner",
|
|
"score": 0.9911457300186157
|
|
},
|
|
{
|
|
"original": "[PATIENT_",
|
|
"replacement": "[PERSONNE_4]",
|
|
"source": "ner",
|
|
"score": 0.9011262655258179
|
|
},
|
|
{
|
|
"original": "[MEDECIN_",
|
|
"replacement": "[PERSONNE_5]",
|
|
"source": "ner",
|
|
"score": 0.9595016837120056
|
|
},
|
|
{
|
|
"original": "[MEDECIN_1",
|
|
"replacement": "[PERSONNE_6]",
|
|
"source": "ner",
|
|
"score": 0.9397991895675659
|
|
},
|
|
{
|
|
"original": "[PATIENT_1",
|
|
"replacement": "[PERSONNE_7]",
|
|
"source": "ner",
|
|
"score": 0.8538002371788025
|
|
},
|
|
{
|
|
"original": "[PATIENT_4",
|
|
"replacement": "[PERSONNE_8]",
|
|
"source": "ner",
|
|
"score": 0.9395274519920349
|
|
}
|
|
]
|
|
} |