741 lines
16 KiB
JSON
741 lines
16 KiB
JSON
{
|
|
"source_file": "CRH 23054001.pdf",
|
|
"total_replacements": 1009,
|
|
"regex_replacements": 312,
|
|
"ner_replacements": 17,
|
|
"sweep_replacements": 680,
|
|
"entities_found": [
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10110601324",
|
|
"replacement": "[RPPS_1]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101096005",
|
|
"replacement": "[RPPS_2]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100163277",
|
|
"replacement": "[RPPS_3]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101639580",
|
|
"replacement": "[RPPS_4]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10004606595",
|
|
"replacement": "[RPPS_5]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101480506",
|
|
"replacement": "[RPPS_6]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102268702",
|
|
"replacement": "[RPPS_8]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10102272209",
|
|
"replacement": "[RPPS_9]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10101856135",
|
|
"replacement": "[RPPS_10]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10002815024",
|
|
"replacement": "[RPPS_11]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100817005",
|
|
"replacement": "[RPPS_12]",
|
|
"source": "regex",
|
|
"category": "rpps"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "10100858090",
|
|
"replacement": "[RPPS_7]",
|
|
"source": "regex",
|
|
"category": "code_barre"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "secr.medint@ch-cotebasque.fr",
|
|
"replacement": "[EMAIL_1]",
|
|
"source": "regex",
|
|
"category": "email"
|
|
},
|
|
{
|
|
"original": "Suzanne DEVAUX",
|
|
"replacement": "[MEDECIN_11]",
|
|
"source": "ner",
|
|
"score": 0.977254331111908
|
|
},
|
|
{
|
|
"original": "[MEDEC",
|
|
"replacement": "[PERSONNE_1]",
|
|
"source": "ner",
|
|
"score": 0.8499495983123779
|
|
},
|
|
{
|
|
"original": "[MEDECIN_59",
|
|
"replacement": "[PERSONNE_2]",
|
|
"source": "ner",
|
|
"score": 0.9779580235481262
|
|
},
|
|
{
|
|
"original": "[MEDECIN_69",
|
|
"replacement": "[PERSONNE_3]",
|
|
"source": "ner",
|
|
"score": 0.965174674987793
|
|
},
|
|
{
|
|
"original": "[MEDECIN_61",
|
|
"replacement": "[PERSONNE_4]",
|
|
"source": "ner",
|
|
"score": 0.9661189913749695
|
|
},
|
|
{
|
|
"original": "LACROIX Fabienne",
|
|
"replacement": "[PERSONNE_5]",
|
|
"source": "ner",
|
|
"score": 0.9854527115821838
|
|
},
|
|
{
|
|
"original": "MEDECIN_",
|
|
"replacement": "[PERSONNE_6]",
|
|
"source": "ner",
|
|
"score": 0.8932056427001953
|
|
},
|
|
{
|
|
"original": "J. LOEB",
|
|
"replacement": "[PERSONNE_7]",
|
|
"source": "ner",
|
|
"score": 0.8495378494262695
|
|
},
|
|
{
|
|
"original": "Irène MACHELART",
|
|
"replacement": "[MEDECIN_7]",
|
|
"source": "ner",
|
|
"score": 0.9984633326530457
|
|
},
|
|
{
|
|
"original": "MARTIN LECAMP Gonzague",
|
|
"replacement": "[SOIGNANT_1]",
|
|
"source": "ner",
|
|
"score": 0.9970604777336121
|
|
},
|
|
{
|
|
"original": "Elisabeth GUINARD",
|
|
"replacement": "[MEDECIN_12]",
|
|
"source": "ner",
|
|
"score": 0.9969264268875122
|
|
},
|
|
{
|
|
"original": "[MEDECIN",
|
|
"replacement": "[PERSONNE_8]",
|
|
"source": "ner",
|
|
"score": 0.9728299975395203
|
|
},
|
|
{
|
|
"original": "[MEDECIN_",
|
|
"replacement": "[PERSONNE_9]",
|
|
"source": "ner",
|
|
"score": 0.9876055717468262
|
|
},
|
|
{
|
|
"original": "Dr [MEDECIN_43",
|
|
"replacement": "[PERSONNE_10]",
|
|
"source": "ner",
|
|
"score": 0.8862084150314331
|
|
},
|
|
{
|
|
"original": "[MEDECIN_51",
|
|
"replacement": "[PERSONNE_11]",
|
|
"source": "ner",
|
|
"score": 0.896079957485199
|
|
},
|
|
{
|
|
"original": "[MEDECIN_52",
|
|
"replacement": "[PERSONNE_12]",
|
|
"source": "ner",
|
|
"score": 0.9500650763511658
|
|
},
|
|
{
|
|
"original": "[MEDECIN_55",
|
|
"replacement": "[PERSONNE_13]",
|
|
"source": "ner",
|
|
"score": 0.9211677312850952
|
|
}
|
|
]
|
|
} |