chore: add .gitignore

This commit is contained in:
dom
2026-03-05 00:37:34 +01:00
parent da34bdc8d7
commit d2e0fec97d
2087 changed files with 1485338 additions and 14 deletions

View File

@@ -0,0 +1,621 @@
{
"source_file": "CRH 23106204.pdf",
"total_replacements": 467,
"regex_replacements": 227,
"ner_replacements": 20,
"sweep_replacements": 220,
"entities_found": [
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101856135",
"replacement": "[RPPS_10]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101856135",
"replacement": "[RPPS_10]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101856135",
"replacement": "[RPPS_10]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101856135",
"replacement": "[RPPS_10]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "10110601324",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101096005",
"replacement": "[RPPS_2]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100163277",
"replacement": "[RPPS_3]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101639580",
"replacement": "[RPPS_4]",
"source": "regex",
"category": "rpps"
},
{
"original": "10004606595",
"replacement": "[RPPS_5]",
"source": "regex",
"category": "rpps"
},
{
"original": "10101480506",
"replacement": "[RPPS_6]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100858090",
"replacement": "[RPPS_7]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102268702",
"replacement": "[RPPS_8]",
"source": "regex",
"category": "rpps"
},
{
"original": "10102272209",
"replacement": "[RPPS_9]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002815024",
"replacement": "[RPPS_11]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100817005",
"replacement": "[RPPS_12]",
"source": "regex",
"category": "rpps"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "secr.medint@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "[MEDECIN_21",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9283413290977478
},
{
"original": "[MEDECIN_47",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9620317220687866
},
{
"original": "Schaeverbeke",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9976910352706909
},
{
"original": "[MEDECIN_49",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9668036699295044
},
{
"original": "[MEDECIN_51",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.9826506972312927
},
{
"original": "[MEDECIN_52",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.8759320378303528
},
{
"original": "Suzanne DEVAUX",
"replacement": "[MEDECIN_12]",
"source": "ner",
"score": 0.9960212111473083
},
{
"original": "[MEDEC",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.9052884578704834
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9543776512145996
},
{
"original": "[MEDECIN_29",
"replacement": "[PERSONNE_9]",
"source": "ner",
"score": 0.9553312063217163
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_10]",
"source": "ner",
"score": 0.9908908009529114
},
{
"original": "[MEDECIN_33",
"replacement": "[PERSONNE_11]",
"source": "ner",
"score": 0.884074866771698
},
{
"original": "[MEDECIN_35",
"replacement": "[PERSONNE_12]",
"source": "ner",
"score": 0.9136056900024414
},
{
"original": "Babinski",
"replacement": "[PERSONNE_13]",
"source": "ner",
"score": 0.9957528710365295
},
{
"original": "[MEDECIN_20",
"replacement": "[PERSONNE_14]",
"source": "ner",
"score": 0.8753734230995178
},
{
"original": "[MEDECIN_48",
"replacement": "[PERSONNE_15]",
"source": "ner",
"score": 0.9527720212936401
},
{
"original": "[MEDECIN_26",
"replacement": "[PERSONNE_16]",
"source": "ner",
"score": 0.9303566813468933
},
{
"original": "[MEDECIN_50",
"replacement": "[PERSONNE_17]",
"source": "ner",
"score": 0.9252082109451294
},
{
"original": "GONZALEZ Isabelle",
"replacement": "[PERSONNE_18]",
"source": "ner",
"score": 0.9956825375556946
},
{
"original": "[MEDECIN_34",
"replacement": "[PERSONNE_19]",
"source": "ner",
"score": 0.914669930934906
}
]
}

View File

@@ -0,0 +1,399 @@
{
"source_file": "trackare-BA038066-23106204_BA038066_23106204.pdf",
"total_replacements": 597,
"regex_replacements": 145,
"ner_replacements": 32,
"sweep_replacements": 420,
"entities_found": [
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23106204",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "274126410218232",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "274126410218232",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "274126410218232",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "274126410218232",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "64102",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "64102",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "64102",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "64102",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "BAYONNE",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "JAOUEN BURTIN BURTIN",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9970154762268066
},
{
"original": "Kappa",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9625274538993835
},
{
"original": "Hutchison",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9971087574958801
},
{
"original": "GONZALEZ",
"replacement": "[PATIENT]",
"source": "ner",
"score": 0.9817298054695129
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9399986863136292
},
{
"original": "MEDEC",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.8019065856933594
},
{
"original": "[MEDECIN_32",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.9755262136459351
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.9400013089179993
},
{
"original": "ISABELLE",
"replacement": "[PATIENT]",
"source": "ner",
"score": 0.9621198177337646
},
{
"original": "KHIMMI Sanae",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9990296959877014
},
{
"original": "VILLETTE Paul-Emile Signé",
"replacement": "[PERSONNE_9]",
"source": "ner",
"score": 0.9982556104660034
},
{
"original": "VILLETTE Paul-Emile S",
"replacement": "[PERSONNE_10]",
"source": "ner",
"score": 0.9604654908180237
},
{
"original": "VILLETTE Paul-Emile",
"replacement": "[PERSONNE_11]",
"source": "ner",
"score": 0.9941578507423401
},
{
"original": "KHIMMI",
"replacement": "[PERSONNE]",
"source": "ner",
"score": 0.9697656631469727
},
{
"original": "Sanae TOILETTE",
"replacement": "[PERSONNE_12]",
"source": "ner",
"score": 0.8095514178276062
},
{
"original": "Sanae SOMMEIL",
"replacement": "[PERSONNE_13]",
"source": "ner",
"score": 0.9461601376533508
},
{
"original": "BICHAREIL",
"replacement": "[PERSONNE_14]",
"source": "ner",
"score": 0.864852786064148
},
{
"original": "Elina SOMMEIL",
"replacement": "[PERSONNE_15]",
"source": "ner",
"score": 0.8774647116661072
},
{
"original": "Paul-Emile VILLETTE",
"replacement": "[PERSONNE_16]",
"source": "ner",
"score": 0.9987941384315491
},
{
"original": "Paul-Emile",
"replacement": "[PERSONNE]",
"source": "ner",
"score": 0.9810208082199097
},
{
"original": "PARACETAMOL ARW",
"replacement": "[PERSONNE_17]",
"source": "ner",
"score": 0.9146762490272522
},
{
"original": "PANTOPRAZOLE Paul-Emile",
"replacement": "[PERSONNE_18]",
"source": "ner",
"score": 0.9250763058662415
},
{
"original": "MONTELUKAST Paul-Emile ARW",
"replacement": "[PERSONNE_19]",
"source": "ner",
"score": 0.8582585453987122
},
{
"original": "MICROG Paul-Emile",
"replacement": "[PERSONNE_20]",
"source": "ner",
"score": 0.8708341717720032
},
{
"original": "Schaverberke",
"replacement": "[PERSONNE_21]",
"source": "ner",
"score": 0.9982932209968567
},
{
"original": "ARDILOUZE",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.9545130729675293
},
{
"original": "Humira",
"replacement": "[PERSONNE_22]",
"source": "ner",
"score": 0.968502938747406
},
{
"original": "MEDECIN_",
"replacement": "[PERSONNE_23]",
"source": "ner",
"score": 0.8602863550186157
},
{
"original": "Schaeverbeke",
"replacement": "[PERSONNE_24]",
"source": "ner",
"score": 0.9972837567329407
},
{
"original": "Babinski",
"replacement": "[PERSONNE_25]",
"source": "ner",
"score": 0.9958868026733398
},
{
"original": "Pr Schaeverbeke",
"replacement": "[PERSONNE_26]",
"source": "ner",
"score": 0.9221699237823486
},
{
"original": "Epoux gonzalez xavier",
"replacement": "[CONTACT_1]",
"source": "ner",
"score": 0.8687083721160889
}
]
}