chore: add .gitignore

This commit is contained in:
dom
2026-03-05 00:37:34 +01:00
parent da34bdc8d7
commit d2e0fec97d
2087 changed files with 1485338 additions and 14 deletions

View File

@@ -0,0 +1,81 @@
{
"source_file": "BACTERIO 23102610.pdf",
"total_replacements": 20,
"regex_replacements": 9,
"ner_replacements": 11,
"sweep_replacements": 0,
"entities_found": [
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "BARGAIN Beatrice",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9946607351303101
},
{
"original": "GSCHWIND Marion",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9941439628601074
},
{
"original": "BRONSWICK",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9853192567825317
},
{
"original": "BRONSWICK Gildas",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9887723922729492
},
{
"original": "DECOEUR Lucie",
"replacement": "[MEDECIN_10]",
"source": "ner",
"score": 0.9970130920410156
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.937204897403717
},
{
"original": "MONIER Laurie",
"replacement": "[MEDECIN_8]",
"source": "ner",
"score": 0.9974474906921387
},
{
"original": "GUILLEMAUD Julien",
"replacement": "[MEDECIN_6]",
"source": "ner",
"score": 0.998172402381897
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.9457688331604004
},
{
"original": "LEYSSENE David",
"replacement": "[MEDECIN_3]",
"source": "ner",
"score": 0.9976966977119446
},
{
"original": "Jacques Loëb",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.9719934463500977
}
]
}

View File

@@ -0,0 +1,261 @@
{
"source_file": "CRH 23102610.pdf",
"total_replacements": 481,
"regex_replacements": 298,
"ner_replacements": 39,
"sweep_replacements": 144,
"entities_found": [
{
"original": "10100402527",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "10100402527",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "10100402527",
"replacement": "[CODE_BARRE_1]",
"source": "regex",
"category": "code_barre"
},
{
"original": "[MEDECIN_61",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9211746454238892
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9492493867874146
},
{
"original": "Julien MARY",
"replacement": "[MEDECIN_19]",
"source": "ner",
"score": 0.9972638487815857
},
{
"original": "'HALLUIN",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.9035077095031738
},
{
"original": "Laure ALLEMAN PR. LOISEAU Hugues",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.9858086705207825
},
{
"original": "ARISTEGUY Jacques",
"replacement": "[MEDECIN_29]",
"source": "ner",
"score": 0.9983139038085938
},
{
"original": "Dr [MEDECIN",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.8403686881065369
},
{
"original": "Monsieur [PATIENT",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.8921545147895813
},
{
"original": "Dr [MEDECIN_",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.8567573428153992
},
{
"original": "MEDEC",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.8267822861671448
},
{
"original": "[MEDECIN_49",
"replacement": "[PERSONNE_9]",
"source": "ner",
"score": 0.9664043188095093
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE]",
"source": "ner",
"score": 0.9854629635810852
},
{
"original": "Matutes",
"replacement": "[PERSONNE_10]",
"source": "ner",
"score": 0.9714286923408508
},
{
"original": "[MEDECIN_47",
"replacement": "[PERSONNE_11]",
"source": "ner",
"score": 0.9220735430717468
},
{
"original": "J. LOEB",
"replacement": "[PERSONNE_12]",
"source": "ner",
"score": 0.9792612195014954
},
{
"original": "[MEDECIN_41",
"replacement": "[PERSONNE_13]",
"source": "ner",
"score": 0.9370009303092957
},
{
"original": "[MEDECIN_66",
"replacement": "[PERSONNE_14]",
"source": "ner",
"score": 0.8901724219322205
},
{
"original": "57 BOULEVARD GENERAL LECLERC Dr [MEDECIN_",
"replacement": "[PERSONNE_15]",
"source": "ner",
"score": 0.9171126484870911
},
{
"original": "Irène MACHELART",
"replacement": "[MEDECIN_25]",
"source": "ner",
"score": 0.9988975524902344
},
{
"original": "Alexia HOURDILLE",
"replacement": "[MEDECIN_23]",
"source": "ner",
"score": 0.9989216923713684
},
{
"original": "Mathieu AUZI",
"replacement": "[MEDECIN_9]",
"source": "ner",
"score": 0.9983761310577393
},
{
"original": "Laurence RITZ-QUILLACQ",
"replacement": "[MEDECIN_7]",
"source": "ner",
"score": 0.998863697052002
},
{
"original": "[MEDECIN_44",
"replacement": "[PERSONNE_16]",
"source": "ner",
"score": 0.8365264534950256
},
{
"original": "MAURY Elisa",
"replacement": "[MEDECIN_28]",
"source": "ner",
"score": 0.9980913400650024
},
{
"original": "[MEDECIN_30",
"replacement": "[PERSONNE_17]",
"source": "ner",
"score": 0.9518200755119324
},
{
"original": "[MEDECIN_48",
"replacement": "[PERSONNE_18]",
"source": "ner",
"score": 0.9446713328361511
},
{
"original": "[MEDECIN_50",
"replacement": "[PERSONNE_19]",
"source": "ner",
"score": 0.9095359444618225
},
{
"original": "[MEDECIN_52",
"replacement": "[PERSONNE_20]",
"source": "ner",
"score": 0.9573572278022766
},
{
"original": "[MEDECIN_53",
"replacement": "[PERSONNE_21]",
"source": "ner",
"score": 0.9611626863479614
},
{
"original": "Laure ALLEMAN",
"replacement": "[MEDECIN_14]",
"source": "ner",
"score": 0.9981555342674255
},
{
"original": "[MEDECIN_39",
"replacement": "[PERSONNE_22]",
"source": "ner",
"score": 0.9500394463539124
},
{
"original": "[MEDECIN_58",
"replacement": "[PERSONNE_23]",
"source": "ner",
"score": 0.9476885795593262
},
{
"original": "[MEDECIN_59",
"replacement": "[PERSONNE_24]",
"source": "ner",
"score": 0.9671294093132019
},
{
"original": "Pr Loiseau",
"replacement": "[PERSONNE_25]",
"source": "ner",
"score": 0.8719029426574707
},
{
"original": "Thibault MOLES",
"replacement": "[MEDECIN_20]",
"source": "ner",
"score": 0.9977443814277649
},
{
"original": "[MEDECIN_37",
"replacement": "[PERSONNE_26]",
"source": "ner",
"score": 0.8874963521957397
},
{
"original": "Heidi WILLE",
"replacement": "[MEDECIN_13]",
"source": "ner",
"score": 0.997164249420166
},
{
"original": "Anne BARTEAU",
"replacement": "[MEDECIN_4]",
"source": "ner",
"score": 0.9978933930397034
},
{
"original": "BRONSWICK GILDAS",
"replacement": "[PATIENT_2]",
"source": "ner",
"score": 0.9983031749725342
}
]
}

View File

@@ -0,0 +1,441 @@
{
"source_file": "trackare-01290152-23102610_01290152_23102610.pdf",
"total_replacements": 425,
"regex_replacements": 98,
"ner_replacements": 36,
"sweep_replacements": 291,
"entities_found": [
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "01290152",
"replacement": "[IPP_1]",
"source": "regex",
"category": "ipp"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "23102610",
"replacement": "[EPISODE_1]",
"source": "regex",
"category": "episode"
},
{
"original": "640000162",
"replacement": "[FINESS]",
"source": "regex",
"category": "finess"
},
{
"original": "CHAMPIGNY-SUR-MARNE",
"replacement": "[LIEU_NAISS_1]",
"source": "regex",
"category": "lieu_naissance"
},
{
"original": "JAOUEN",
"replacement": "[PERSONNE_1]",
"source": "ner",
"score": 0.9962719678878784
},
{
"original": "Rémi SEGUES",
"replacement": "[PERSONNE_2]",
"source": "ner",
"score": 0.9978815317153931
},
{
"original": "[MEDECIN_10",
"replacement": "[PERSONNE_3]",
"source": "ner",
"score": 0.8847193121910095
},
{
"original": "[MEDECIN",
"replacement": "[PERSONNE_4]",
"source": "ner",
"score": 0.985040545463562
},
{
"original": "[MEDECIN_",
"replacement": "[PERSONNE_5]",
"source": "ner",
"score": 0.9797776341438293
},
{
"original": "Oui",
"replacement": "[PERSONNE_6]",
"source": "ner",
"score": 0.9501992464065552
},
{
"original": "LARQUIER Camille Signé",
"replacement": "[PERSONNE_7]",
"source": "ner",
"score": 0.9967018961906433
},
{
"original": "MAJCHRZAK Camille Marie Signé",
"replacement": "[PERSONNE_8]",
"source": "ner",
"score": 0.9987678527832031
},
{
"original": "MAJCHRZAK Camille Signé",
"replacement": "[PERSONNE_9]",
"source": "ner",
"score": 0.997112512588501
},
{
"original": "GLYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_10]",
"source": "ner",
"score": 0.993213951587677
},
{
"original": "BRAYER Céline Signé",
"replacement": "[PERSONNE_11]",
"source": "ner",
"score": 0.9806097149848938
},
{
"original": "BRAYER Céline",
"replacement": "[PERSONNE_12]",
"source": "ner",
"score": 0.9857642650604248
},
{
"original": "LYCEMIE CAPILLAIRE",
"replacement": "[PERSONNE_13]",
"source": "ner",
"score": 0.8009800910949707
},
{
"original": "Céline Signé",
"replacement": "[PERSONNE_14]",
"source": "ner",
"score": 0.993458092212677
},
{
"original": "LARQUIER Camille",
"replacement": "[PERSONNE_15]",
"source": "ner",
"score": 0.9880821108818054
},
{
"original": "Camille PATIENT",
"replacement": "[PERSONNE_16]",
"source": "ner",
"score": 0.9125155806541443
},
{
"original": "MAJCHRZAK Camille",
"replacement": "[PERSONNE_17]",
"source": "ner",
"score": 0.9927541017532349
},
{
"original": "Marie",
"replacement": "[SOIGNANT]",
"source": "ner",
"score": 0.9366453289985657
},
{
"original": "Marie INJ",
"replacement": "[PERSONNE_18]",
"source": "ner",
"score": 0.9020470976829529
},
{
"original": "Marie ORALE",
"replacement": "[PERSONNE_19]",
"source": "ner",
"score": 0.9948503971099854
},
{
"original": "Marie CREME",
"replacement": "[PERSONNE_20]",
"source": "ner",
"score": 0.9910940527915955
},
{
"original": "CUTANEE MAJCHRZAK Camille",
"replacement": "[PERSONNE_21]",
"source": "ner",
"score": 0.9586679339408875
},
{
"original": "Céline S",
"replacement": "[PERSONNE_22]",
"source": "ner",
"score": 0.8429950475692749
},
{
"original": "LARQUIER",
"replacement": "[PERSONNE]",
"source": "ner",
"score": 0.9438746571540833
},
{
"original": "Camille Marie MAJCHRZAK",
"replacement": "[PERSONNE_23]",
"source": "ner",
"score": 0.9951679706573486
},
{
"original": "MAJCHRZAK",
"replacement": "[MEDECIN]",
"source": "ner",
"score": 0.987483024597168
},
{
"original": "Camille Marie",
"replacement": "[PERSONNE_24]",
"source": "ner",
"score": 0.981324315071106
},
{
"original": "MAJCH",
"replacement": "[PERSONNE_25]",
"source": "ner",
"score": 0.8898651599884033
},
{
"original": "Camille Marie INJ STYLO",
"replacement": "[PERSONNE_26]",
"source": "ner",
"score": 0.9957061409950256
},
{
"original": "Eileen PAWLAK",
"replacement": "[PERSONNE_27]",
"source": "ner",
"score": 0.9977694153785706
},
{
"original": "Loiseau",
"replacement": "[PERSONNE_28]",
"source": "ner",
"score": 0.9924784898757935
},
{
"original": "Janumet",
"replacement": "[PERSONNE_29]",
"source": "ner",
"score": 0.9008945822715759
},
{
"original": "Matutes",
"replacement": "[PERSONNE_30]",
"source": "ner",
"score": 0.9717926979064941
},
{
"original": "Pr Loiseau",
"replacement": "[PERSONNE_31]",
"source": "ner",
"score": 0.8556192517280579
},
{
"original": "LAGNAOUI",
"replacement": "[PERSONNE_32]",
"source": "ner",
"score": 0.8377308249473572
},
{
"original": "J. LOEB",
"replacement": "[PERSONNE_33]",
"source": "ner",
"score": 0.8255879878997803
}
]
}