chore: add .gitignore

This commit is contained in:
dom
2026-03-05 00:37:34 +01:00
parent da34bdc8d7
commit d2e0fec97d
2087 changed files with 1485338 additions and 14 deletions

View File

@@ -0,0 +1,57 @@
{
"source_file": "195_23144210 ANAPATH.pdf",
"total_replacements": 23,
"regex_replacements": 14,
"ner_replacements": 8,
"sweep_replacements": 1,
"entities_found": [
{
"original": "JEAN CLAUDE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8732696771621704
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.951208770275116
},
{
"original": "[MEDECIN_12",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9328235983848572
},
{
"original": "ETCHEVERRY JEAN CLAUDE",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9805051684379578
},
{
"original": "Elodie LAURENT",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.9980888962745667
},
{
"original": "Lewis GRECOURT",
"replacement": "[MEDECIN_5]",
"source": "ner",
"score": 0.9984787702560425
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.8459715843200684
},
{
"original": "Marie DESROUSSEAUX",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.9986457824707031
}
]
}

View File

@@ -0,0 +1,369 @@
{
"source_file": "CRH 23144210.pdf",
"total_replacements": 231,
"regex_replacements": 141,
"ner_replacements": 10,
"sweep_replacements": 80,
"entities_found": [
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "10100532760",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100532760",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100532760",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10100532760",
"replacement": "[RPPS_1]",
"source": "regex",
"category": "rpps"
},
{
"original": "10002456746",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "10002456746",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "fprevost@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "boui@ch-cotebasque.fr",
"replacement": "[EMAIL_2]",
"source": "regex",
"category": "email"
},
{
"original": "dnivet@ch-cotebasque.fr",
"replacement": "[EMAIL_3]",
"source": "regex",
"category": "email"
},
{
"original": "tkhuong-huu@ch-cotebasque.fr",
"replacement": "[EMAIL_4]",
"source": "regex",
"category": "email"
},
{
"original": "aguilngar@ch-cotebasque.fr",
"replacement": "[EMAIL_5]",
"source": "regex",
"category": "email"
},
{
"original": "fgoutorbe@ch-cotebasque.fr",
"replacement": "[EMAIL_6]",
"source": "regex",
"category": "email"
},
{
"original": "mcboudier@ch-cotebasque.fr",
"replacement": "[EMAIL_7]",
"source": "regex",
"category": "email"
},
{
"original": "mbrugel@ch-cotebasque.fr",
"replacement": "[EMAIL_8]",
"source": "regex",
"category": "email"
},
{
"original": "mboube@ch-cotebasque.fr",
"replacement": "[EMAIL_9]",
"source": "regex",
"category": "email"
},
{
"original": "faudemar@ch-cotebasque.fr",
"replacement": "[EMAIL_10]",
"source": "regex",
"category": "email"
},
{
"original": "fprevost@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "boui@ch-cotebasque.fr",
"replacement": "[EMAIL_2]",
"source": "regex",
"category": "email"
},
{
"original": "dnivet@ch-cotebasque.fr",
"replacement": "[EMAIL_3]",
"source": "regex",
"category": "email"
},
{
"original": "tkhuong-huu@ch-cotebasque.fr",
"replacement": "[EMAIL_4]",
"source": "regex",
"category": "email"
},
{
"original": "aguilngar@ch-cotebasque.fr",
"replacement": "[EMAIL_5]",
"source": "regex",
"category": "email"
},
{
"original": "fgoutorbe@ch-cotebasque.fr",
"replacement": "[EMAIL_6]",
"source": "regex",
"category": "email"
},
{
"original": "mcboudier@ch-cotebasque.fr",
"replacement": "[EMAIL_7]",
"source": "regex",
"category": "email"
},
{
"original": "mbrugel@ch-cotebasque.fr",
"replacement": "[EMAIL_8]",
"source": "regex",
"category": "email"
},
{
"original": "mboube@ch-cotebasque.fr",
"replacement": "[EMAIL_9]",
"source": "regex",
"category": "email"
},
{
"original": "faudemar@ch-cotebasque.fr",
"replacement": "[EMAIL_10]",
"source": "regex",
"category": "email"
},
{
"original": "fprevost@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "boui@ch-cotebasque.fr",
"replacement": "[EMAIL_2]",
"source": "regex",
"category": "email"
},
{
"original": "dnivet@ch-cotebasque.fr",
"replacement": "[EMAIL_3]",
"source": "regex",
"category": "email"
},
{
"original": "tkhuong-huu@ch-cotebasque.fr",
"replacement": "[EMAIL_4]",
"source": "regex",
"category": "email"
},
{
"original": "aguilngar@ch-cotebasque.fr",
"replacement": "[EMAIL_5]",
"source": "regex",
"category": "email"
},
{
"original": "fgoutorbe@ch-cotebasque.fr",
"replacement": "[EMAIL_6]",
"source": "regex",
"category": "email"
},
{
"original": "mcboudier@ch-cotebasque.fr",
"replacement": "[EMAIL_7]",
"source": "regex",
"category": "email"
},
{
"original": "mbrugel@ch-cotebasque.fr",
"replacement": "[EMAIL_8]",
"source": "regex",
"category": "email"
},
{
"original": "mboube@ch-cotebasque.fr",
"replacement": "[EMAIL_9]",
"source": "regex",
"category": "email"
},
{
"original": "faudemar@ch-cotebasque.fr",
"replacement": "[EMAIL_10]",
"source": "regex",
"category": "email"
},
{
"original": "fprevost@ch-cotebasque.fr",
"replacement": "[EMAIL_1]",
"source": "regex",
"category": "email"
},
{
"original": "boui@ch-cotebasque.fr",
"replacement": "[EMAIL_2]",
"source": "regex",
"category": "email"
},
{
"original": "dnivet@ch-cotebasque.fr",
"replacement": "[EMAIL_3]",
"source": "regex",
"category": "email"
},
{
"original": "tkhuong-huu@ch-cotebasque.fr",
"replacement": "[EMAIL_4]",
"source": "regex",
"category": "email"
},
{
"original": "aguilngar@ch-cotebasque.fr",
"replacement": "[EMAIL_5]",
"source": "regex",
"category": "email"
},
{
"original": "fgoutorbe@ch-cotebasque.fr",
"replacement": "[EMAIL_6]",
"source": "regex",
"category": "email"
},
{
"original": "mcboudier@ch-cotebasque.fr",
"replacement": "[EMAIL_7]",
"source": "regex",
"category": "email"
},
{
"original": "mbrugel@ch-cotebasque.fr",
"replacement": "[EMAIL_8]",
"source": "regex",
"category": "email"
},
{
"original": "mboube@ch-cotebasque.fr",
"replacement": "[EMAIL_9]",
"source": "regex",
"category": "email"
},
{
"original": "faudemar@ch-cotebasque.fr",
"replacement": "[EMAIL_10]",
"source": "regex",
"category": "email"
},
{
"original": "PEREIRE",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.8377689719200134
},
{
"original": "J. LOEB",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.8885625600814819
},
{
"original": "BROUZENG Jean-Paul A",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9319342970848083
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.8703416585922241
},
{
"original": "Grellety",
"replacement": "[MEDECIN]",
"source": "ner",
"score": 0.9830475449562073
},
{
"original": "[PATIENT_",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.8875940442085266
},
{
"original": "[MEDECIN_15",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.8140742182731628
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.9443742632865906
},
{
"original": "ETCHEVERRY Jean-claude",
"replacement": "[PATIENT_4]",
"source": "ner",
"score": 0.9849814176559448
},
{
"original": "ETCHEVERRY JEAN CLAUDE",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9797188639640808
}
]
}

View File

@@ -0,0 +1,267 @@
{
"source_file": "trackare-BA119282-23144210_BA119282_23144210.pdf",
"total_replacements": 549,
"regex_replacements": 96,
"ner_replacements": 19,
"sweep_replacements": 434,
"entities_found": [
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23144210",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "151056454701737",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "151056454701737",
"replacement": "[NIR_1]",
"source": "regex",
"category": "nir"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "64547",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "64547",
"replacement": "[LIEU_NAISS_2]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "USTARITZ",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "ETCHEVERRY",
"replacement": "[PATIENT]",
"source": "ner",
"score": 0.8786582946777344
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9375270009040833
},
{
"original": "JEAN-CLAUDE",
"replacement": "[PATIENT]",
"source": "ner",
"score": 0.9499256014823914
},
{
"original": "KWIKPEN SOL MEURAT Aurore",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9933945536613464
},
{
"original": "HUMALOG 300UI KWIKPEN SOL MEURAT Aurore",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9421625137329102
},
{
"original": "MG MEURAT Aurore",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.895708441734314
},
{
"original": "SPASFON",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.9559392929077148
},
{
"original": "MEURAT Aurore GELULE",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.9800611734390259
},
{
"original": "REN MEURAT Aurore",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.8999844789505005
},
{
"original": "ALMEIRAS Nanciancena",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9671063423156738
},
{
"original": "HUMALOG 300UI KWIKPEN SOL",
"replacement": "[PERSONNE_9]",
"source": "ner",
"score": 0.9648926258087158
},
{
"original": "UI KWIKPEN SOL MEURAT Aurore",
"replacement": "[PERSONNE_10]",
"source": "ner",
"score": 0.8747116327285767
},
{
"original": "HUMALOG",
"replacement": "[PERSONNE]",
"source": "ner",
"score": 0.9397028088569641
},
{
"original": "ZYLORIC",
"replacement": "[PERSONNE_11]",
"source": "ner",
"score": 0.928149402141571
},
{
"original": "MEURAT Aurore",
"replacement": "[PERSONNE_12]",
"source": "ner",
"score": 0.9939867258071899
},
{
"original": "CHL REN MEURAT Aurore",
"replacement": "[PERSONNE_13]",
"source": "ner",
"score": 0.8374457359313965
},
{
"original": "Aurore MEURAT",
"replacement": "[SOIGNANT_4]",
"source": "ner",
"score": 0.9987927079200745
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_14]",
"source": "ner",
"score": 0.8582423329353333
},
{
"original": "e Bruder Sandrine",
"replacement": "[PERSONNE_15]",
"source": "ner",
"score": 0.8771246075630188
}
]
}