324 lines
18 KiB
JSON
324 lines
18 KiB
JSON
{
|
|
"date": "2026-03-02T11:15:25.581162",
|
|
"total_documents": 27,
|
|
"success_count": 25,
|
|
"total_pii": 1598,
|
|
"total_time_s": 44.145431995391846,
|
|
"avg_time_s": 1.6350159998293277,
|
|
"use_ner": true,
|
|
"use_vlm": false,
|
|
"results": [
|
|
{
|
|
"pdf": "001_simple_unknown_BACTERIO_23018396.pdf",
|
|
"success": true,
|
|
"time_s": 0.3523738384246826,
|
|
"pii_count": 10,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "002_simple_unknown_bacterio_476_23159413.pdf",
|
|
"success": true,
|
|
"time_s": 0.574472188949585,
|
|
"pii_count": 11,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "003_simple_compte_rendu_CRO_23155084.pdf",
|
|
"success": true,
|
|
"time_s": 0.3953683376312256,
|
|
"pii_count": 4,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "004_simple_anapath_anapath_53_23224186.redacted_raster.pdf",
|
|
"success": true,
|
|
"time_s": 0.3364546298980713,
|
|
"pii_count": 0,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "005_simple_compte_rendu_CRH_23155836.pdf",
|
|
"success": true,
|
|
"time_s": 0.7666671276092529,
|
|
"pii_count": 62,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "006_simple_anapath_ANAPATH_23142660.pdf",
|
|
"success": false,
|
|
"time_s": 0.0017955303192138672,
|
|
"error": ""
|
|
},
|
|
{
|
|
"pdf": "007_simple_anapath_ANAPATH_23096332.pdf",
|
|
"success": false,
|
|
"time_s": 0.0013647079467773438,
|
|
"error": ""
|
|
},
|
|
{
|
|
"pdf": "008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pdf",
|
|
"success": true,
|
|
"time_s": 0.40996646881103516,
|
|
"pii_count": 40,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "009_simple_compte_rendu_CRO_23051225.pdf",
|
|
"success": true,
|
|
"time_s": 0.4464128017425537,
|
|
"pii_count": 12,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "010_simple_anapath_ANAPATH_23217289.pdf",
|
|
"success": true,
|
|
"time_s": 0.3622779846191406,
|
|
"pii_count": 16,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "011_moyen_compte_rendu_CRH_23080179.pdf",
|
|
"success": true,
|
|
"time_s": 0.9325697422027588,
|
|
"pii_count": 20,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "012_moyen_compte_rendu_CRH_692_23200418.pdf",
|
|
"success": true,
|
|
"time_s": 0.6736557483673096,
|
|
"pii_count": 32,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "013_moyen_compte_rendu_363_23085243_CRO.pdf",
|
|
"success": true,
|
|
"time_s": 0.6802682876586914,
|
|
"pii_count": 34,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "014_moyen_compte_rendu_CRO_23167029.redacted_raster.pdf",
|
|
"success": true,
|
|
"time_s": 0.4354434013366699,
|
|
"pii_count": 0,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pdf",
|
|
"success": true,
|
|
"time_s": 0.9319710731506348,
|
|
"pii_count": 7,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "016_moyen_compte_rendu_CRH_23149905.pdf",
|
|
"success": true,
|
|
"time_s": 1.150942325592041,
|
|
"pii_count": 117,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "017_moyen_compte_rendu_CRO_23222062.redacted_raster.pdf",
|
|
"success": true,
|
|
"time_s": 0.43438720703125,
|
|
"pii_count": 0,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "018_moyen_compte_rendu_CRH_23042753.pdf",
|
|
"success": true,
|
|
"time_s": 1.5716781616210938,
|
|
"pii_count": 123,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "019_moyen_compte_rendu_CRO_332_23049003.pdf",
|
|
"success": true,
|
|
"time_s": 0.7931430339813232,
|
|
"pii_count": 71,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "020_moyen_compte_rendu_CRO_23084754.redacted_raster.pdf",
|
|
"success": true,
|
|
"time_s": 0.43088579177856445,
|
|
"pii_count": 0,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "021_moyen_compte_rendu_CRO_23201117.redacted_raster.pdf",
|
|
"success": true,
|
|
"time_s": 0.3120863437652588,
|
|
"pii_count": 0,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "022_moyen_compte_rendu_cro2_516_23187028.pdf",
|
|
"success": true,
|
|
"time_s": 0.35700511932373047,
|
|
"pii_count": 4,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "023_complexe_compte_rendu_CRH_23102610.pdf",
|
|
"success": true,
|
|
"time_s": 2.7280702590942383,
|
|
"pii_count": 385,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pdf",
|
|
"success": true,
|
|
"time_s": 5.714028835296631,
|
|
"pii_count": 117,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pdf",
|
|
"success": true,
|
|
"time_s": 9.729689836502075,
|
|
"pii_count": 270,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pdf",
|
|
"success": true,
|
|
"time_s": 7.467007637023926,
|
|
"pii_count": 142,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.redacted_raster.pdf"
|
|
}
|
|
},
|
|
{
|
|
"pdf": "027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pdf",
|
|
"success": true,
|
|
"time_s": 6.15097975730896,
|
|
"pii_count": 121,
|
|
"files": {
|
|
"text": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pseudonymise.txt",
|
|
"audit": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.audit.jsonl",
|
|
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.redacted_vector.pdf",
|
|
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.redacted_raster.pdf"
|
|
}
|
|
}
|
|
]
|
|
} |