687 lines
15 KiB
JSON
687 lines
15 KiB
JSON
{
|
|
"source_file": "CRH 23077240.pdf",
|
|
"total_replacements": 403,
|
|
"regex_replacements": 217,
|
|
"ner_replacements": 11,
|
|
"sweep_replacements": 175,
|
|
"entities_found": [
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "23077240",
|
|
"replacement": "[EPISODE_1]",
|
|
"source": "regex",
|
|
"category": "episode"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004401718",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004401718",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004401718",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004401718",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004401718",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102326468",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100422012",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100673481",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100402527",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10000598366",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "10002083912",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "ddemarsy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "ddemarsy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "ddemarsy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "ddemarsy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "ddemarsy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_8]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.csmed@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.endocrino@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_2]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "arajot@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_3]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mauzi@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_4]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "mgschwind@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_5]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "emauryy@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_6]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "lritz@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_7]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "sbordes-couecou@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_9]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "[MEDEC",
|
|
"replacement": "[PERSONNE_1]",
|
|
"source": "ner",
|
|
"score": 0.839705228805542
|
|
},
|
|
{
|
|
"original": "] RITZ-QUILLACQ Laurence",
|
|
"replacement": "[PERSONNE_2]",
|
|
"source": "ner",
|
|
"score": 0.9693486094474792
|
|
},
|
|
{
|
|
"original": "J. LOEB",
|
|
"replacement": "[PERSONNE_3]",
|
|
"source": "ner",
|
|
"score": 0.9611659049987793
|
|
},
|
|
{
|
|
"original": "[MEDECIN",
|
|
"replacement": "[PERSONNE_4]",
|
|
"source": "ner",
|
|
"score": 0.9916445016860962
|
|
},
|
|
{
|
|
"original": "[MEDECIN_19",
|
|
"replacement": "[PERSONNE_5]",
|
|
"source": "ner",
|
|
"score": 0.8811845183372498
|
|
},
|
|
{
|
|
"original": "QUILLACQ",
|
|
"replacement": "[PERSONNE_6]",
|
|
"source": "ner",
|
|
"score": 0.9621496200561523
|
|
},
|
|
{
|
|
"original": "[MEDECIN_30",
|
|
"replacement": "[PERSONNE_7]",
|
|
"source": "ner",
|
|
"score": 0.9423726797103882
|
|
},
|
|
{
|
|
"original": "[MEDECIN_",
|
|
"replacement": "[PERSONNE_8]",
|
|
"source": "ner",
|
|
"score": 0.9832685589790344
|
|
},
|
|
{
|
|
"original": "[MEDECIN_34",
|
|
"replacement": "[PERSONNE_9]",
|
|
"source": "ner",
|
|
"score": 0.9165102243423462
|
|
},
|
|
{
|
|
"original": "LOUTRE Anne-marie",
|
|
"replacement": "[PATIENT_3]",
|
|
"source": "ner",
|
|
"score": 0.9927999973297119
|
|
},
|
|
{
|
|
"original": "[PATIENT",
|
|
"replacement": "[PERSONNE_10]",
|
|
"source": "ner",
|
|
"score": 0.8683153390884399
|
|
}
|
|
]
|
|
} |