Files
anonymisation/tests/ground_truth/quality_evaluation/baseline_quality_evaluation.json

441 lines
10 KiB
JSON

{
"evaluation_date": "2026-03-02",
"total_documents": 25,
"global_metrics": {
"precision": 0.1897,
"recall": 1.0,
"f1_score": 0.3189,
"true_positives": 1159,
"false_positives": 4951,
"false_negatives": 0
},
"by_type": {
"ETABLISSEMENT": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 83,
"false_positives": 0,
"false_negatives": 0
},
"TEL": {
"precision": 0.9602,
"recall": 1.0,
"f1_score": 0.9797,
"true_positives": 193,
"false_positives": 8,
"false_negatives": 0
},
"NOM": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 506,
"false_positives": 0,
"false_negatives": 0
},
"IPP": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 25,
"false_positives": 0,
"false_negatives": 0
},
"NOM_EXTRACTED": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 3846,
"false_negatives": 0
},
"NOM_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 670,
"false_negatives": 0
},
"ETAB_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 36,
"false_negatives": 0
},
"TEL_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 77,
"false_negatives": 0
},
"ADRESSE": {
"precision": 0.878,
"recall": 1.0,
"f1_score": 0.9351,
"true_positives": 72,
"false_positives": 10,
"false_negatives": 0
},
"CODE_POSTAL": {
"precision": 0.8333,
"recall": 1.0,
"f1_score": 0.9091,
"true_positives": 50,
"false_positives": 10,
"false_negatives": 0
},
"DATE_NAISSANCE": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 114,
"false_positives": 0,
"false_negatives": 0
},
"ADRESSE_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 55,
"false_negatives": 0
},
"CODE_POSTAL_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 39,
"false_negatives": 0
},
"DATE_NAISSANCE_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 20,
"false_negatives": 0
},
"EMAIL": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 62,
"false_positives": 0,
"false_negatives": 0
},
"RPPS": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 21,
"false_positives": 0,
"false_negatives": 0
},
"EPISODE": {
"precision": 0.1452,
"recall": 1.0,
"f1_score": 0.2535,
"true_positives": 18,
"false_positives": 106,
"false_negatives": 0
},
"EMAIL_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 28,
"false_negatives": 0
},
"RPPS_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 7,
"false_negatives": 0
},
"EPISODE_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 9,
"false_negatives": 0
},
"VILLE": {
"precision": 0.2,
"recall": 1.0,
"f1_score": 0.3333,
"true_positives": 5,
"false_positives": 20,
"false_negatives": 0
},
"VILLE_GLOBAL": {
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 10,
"false_negatives": 0
},
"AGE": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 5,
"false_positives": 0,
"false_negatives": 0
},
"NIR": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 2,
"false_positives": 0,
"false_negatives": 0
},
"DOSSIER": {
"precision": 1.0,
"recall": 1.0,
"f1_score": 1.0,
"true_positives": 3,
"false_positives": 0,
"false_negatives": 0
}
},
"per_document": [
{
"pdf": "001_simple_unknown_BACTERIO_23018396",
"precision": 0.2326,
"recall": 1.0,
"f1_score": 0.3774,
"true_positives": 10,
"false_positives": 33,
"false_negatives": 0
},
{
"pdf": "002_simple_unknown_bacterio_476_23159413",
"precision": 0.234,
"recall": 1.0,
"f1_score": 0.3793,
"true_positives": 11,
"false_positives": 36,
"false_negatives": 0
},
{
"pdf": "003_simple_compte_rendu_CRO_23155084",
"precision": 0.16,
"recall": 1.0,
"f1_score": 0.2759,
"true_positives": 4,
"false_positives": 21,
"false_negatives": 0
},
{
"pdf": "004_simple_anapath_anapath_53_23224186.redacted_raster",
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 0,
"false_negatives": 0
},
{
"pdf": "005_simple_compte_rendu_CRH_23155836",
"precision": 0.4429,
"recall": 1.0,
"f1_score": 0.6139,
"true_positives": 62,
"false_positives": 78,
"false_negatives": 0
},
{
"pdf": "008_simple_trackare_trackare-14004105-23202435_14004105_23202435",
"precision": 0.1899,
"recall": 1.0,
"f1_score": 0.3191,
"true_positives": 15,
"false_positives": 64,
"false_negatives": 0
},
{
"pdf": "009_simple_compte_rendu_CRO_23051225",
"precision": 0.25,
"recall": 1.0,
"f1_score": 0.4,
"true_positives": 8,
"false_positives": 24,
"false_negatives": 0
},
{
"pdf": "010_simple_anapath_ANAPATH_23217289",
"precision": 0.2549,
"recall": 1.0,
"f1_score": 0.4062,
"true_positives": 13,
"false_positives": 38,
"false_negatives": 0
},
{
"pdf": "011_moyen_compte_rendu_CRH_23080179",
"precision": 0.3158,
"recall": 1.0,
"f1_score": 0.48,
"true_positives": 12,
"false_positives": 26,
"false_negatives": 0
},
{
"pdf": "012_moyen_compte_rendu_CRH_692_23200418",
"precision": 0.297,
"recall": 1.0,
"f1_score": 0.458,
"true_positives": 30,
"false_positives": 71,
"false_negatives": 0
},
{
"pdf": "013_moyen_compte_rendu_363_23085243_CRO",
"precision": 0.2025,
"recall": 1.0,
"f1_score": 0.3368,
"true_positives": 32,
"false_positives": 126,
"false_negatives": 0
},
{
"pdf": "014_moyen_compte_rendu_CRO_23167029.redacted_raster",
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 0,
"false_negatives": 0
},
{
"pdf": "015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653",
"precision": 0.28,
"recall": 1.0,
"f1_score": 0.4375,
"true_positives": 7,
"false_positives": 18,
"false_negatives": 0
},
{
"pdf": "016_moyen_compte_rendu_CRH_23149905",
"precision": 0.477,
"recall": 1.0,
"f1_score": 0.6459,
"true_positives": 114,
"false_positives": 125,
"false_negatives": 0
},
{
"pdf": "017_moyen_compte_rendu_CRO_23222062.redacted_raster",
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 0,
"false_negatives": 0
},
{
"pdf": "018_moyen_compte_rendu_CRH_23042753",
"precision": 0.5279,
"recall": 1.0,
"f1_score": 0.691,
"true_positives": 123,
"false_positives": 110,
"false_negatives": 0
},
{
"pdf": "019_moyen_compte_rendu_CRO_332_23049003",
"precision": 0.3793,
"recall": 1.0,
"f1_score": 0.55,
"true_positives": 55,
"false_positives": 90,
"false_negatives": 0
},
{
"pdf": "020_moyen_compte_rendu_CRO_23084754.redacted_raster",
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 0,
"false_negatives": 0
},
{
"pdf": "021_moyen_compte_rendu_CRO_23201117.redacted_raster",
"precision": 0.0,
"recall": 0.0,
"f1_score": 0.0,
"true_positives": 0,
"false_positives": 0,
"false_negatives": 0
},
{
"pdf": "022_moyen_compte_rendu_cro2_516_23187028",
"precision": 0.1379,
"recall": 1.0,
"f1_score": 0.2424,
"true_positives": 4,
"false_positives": 25,
"false_negatives": 0
},
{
"pdf": "023_complexe_compte_rendu_CRH_23102610",
"precision": 0.6203,
"recall": 1.0,
"f1_score": 0.7657,
"true_positives": 379,
"false_positives": 232,
"false_negatives": 0
},
{
"pdf": "024_complexe_trackare_trackare-17001141-23066188_17001141_23066188",
"precision": 0.0689,
"recall": 1.0,
"f1_score": 0.129,
"true_positives": 53,
"false_positives": 716,
"false_negatives": 0
},
{
"pdf": "025_complexe_trackare_trackare-02016820-23095226_02016820_23095226",
"precision": 0.0643,
"recall": 1.0,
"f1_score": 0.1209,
"true_positives": 96,
"false_positives": 1396,
"false_negatives": 0
},
{
"pdf": "026_complexe_trackare_trackare-15000536-23074384_15000536_23074384",
"precision": 0.0766,
"recall": 1.0,
"f1_score": 0.1422,
"true_positives": 79,
"false_positives": 953,
"false_negatives": 0
},
{
"pdf": "027_complexe_trackare_trackare-10027557-23183041_10027557_23183041",
"precision": 0.0633,
"recall": 1.0,
"f1_score": 0.1191,
"true_positives": 52,
"false_positives": 769,
"false_negatives": 0
}
]
}