feat: Benchmark de performance baseline - 2.62s/doc moyen, 92% dans objectif
This commit is contained in:
26
tests/ground_truth/benchmarks/baseline_benchmark.csv
Normal file
26
tests/ground_truth/benchmarks/baseline_benchmark.csv
Normal file
@@ -0,0 +1,26 @@
|
||||
pdf,time_s,pii_count
|
||||
001_simple_unknown_BACTERIO_23018396.pdf,0.38307929039001465,43
|
||||
002_simple_unknown_bacterio_476_23159413.pdf,0.7698535919189453,47
|
||||
003_simple_compte_rendu_CRO_23155084.pdf,0.41591382026672363,25
|
||||
004_simple_anapath_anapath_53_23224186.redacted_raster.pdf,0.3458268642425537,0
|
||||
005_simple_compte_rendu_CRH_23155836.pdf,0.8738148212432861,140
|
||||
008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pdf,0.4308145046234131,93
|
||||
009_simple_compte_rendu_CRO_23051225.pdf,0.47577404975891113,36
|
||||
010_simple_anapath_ANAPATH_23217289.pdf,0.39705705642700195,54
|
||||
011_moyen_compte_rendu_CRH_23080179.pdf,1.0042967796325684,46
|
||||
012_moyen_compte_rendu_CRH_692_23200418.pdf,0.8403730392456055,103
|
||||
013_moyen_compte_rendu_363_23085243_CRO.pdf,0.94016432762146,160
|
||||
014_moyen_compte_rendu_CRO_23167029.redacted_raster.pdf,0.4384956359863281,0
|
||||
015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pdf,0.9846677780151367,25
|
||||
016_moyen_compte_rendu_CRH_23149905.pdf,1.4508278369903564,242
|
||||
017_moyen_compte_rendu_CRO_23222062.redacted_raster.pdf,0.4350569248199463,0
|
||||
018_moyen_compte_rendu_CRH_23042753.pdf,1.9062294960021973,233
|
||||
019_moyen_compte_rendu_CRO_332_23049003.pdf,1.020752191543579,161
|
||||
020_moyen_compte_rendu_CRO_23084754.redacted_raster.pdf,0.4804375171661377,0
|
||||
021_moyen_compte_rendu_CRO_23201117.redacted_raster.pdf,0.31412649154663086,0
|
||||
022_moyen_compte_rendu_cro2_516_23187028.pdf,0.37198877334594727,29
|
||||
023_complexe_compte_rendu_CRH_23102610.pdf,4.054161310195923,617
|
||||
024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pdf,8.550535917282104,804
|
||||
025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pdf,17.83988666534424,1622
|
||||
026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pdf,12.040966749191284,1056
|
||||
027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pdf,8.782238721847534,859
|
||||
|
151
tests/ground_truth/benchmarks/baseline_benchmark.json
Normal file
151
tests/ground_truth/benchmarks/baseline_benchmark.json
Normal file
@@ -0,0 +1,151 @@
|
||||
{
|
||||
"date": "2026-03-02T10:41:42.160164",
|
||||
"batch_date": "2026-03-02T10:29:28.280047",
|
||||
"configuration": {
|
||||
"use_ner": true,
|
||||
"use_vlm": false
|
||||
},
|
||||
"statistics": {
|
||||
"total_documents": 25,
|
||||
"total_time_s": 65.54734015464783,
|
||||
"avg_time_s": 2.621893606185913,
|
||||
"median_time_s": 0.8403730392456055,
|
||||
"min_time_s": 0.31412649154663086,
|
||||
"max_time_s": 17.83988666534424,
|
||||
"stdev_time_s": 4.432960605030657,
|
||||
"total_pii": 6395,
|
||||
"avg_pii": 255.8,
|
||||
"median_pii": 54,
|
||||
"min_pii": 0,
|
||||
"max_pii": 1622,
|
||||
"docs_per_second": 0.3814037295947744,
|
||||
"pii_per_second": 97.5630740303433
|
||||
},
|
||||
"documents": [
|
||||
{
|
||||
"pdf": "001_simple_unknown_BACTERIO_23018396.pdf",
|
||||
"time_s": 0.38307929039001465,
|
||||
"pii_count": 43
|
||||
},
|
||||
{
|
||||
"pdf": "002_simple_unknown_bacterio_476_23159413.pdf",
|
||||
"time_s": 0.7698535919189453,
|
||||
"pii_count": 47
|
||||
},
|
||||
{
|
||||
"pdf": "003_simple_compte_rendu_CRO_23155084.pdf",
|
||||
"time_s": 0.41591382026672363,
|
||||
"pii_count": 25
|
||||
},
|
||||
{
|
||||
"pdf": "004_simple_anapath_anapath_53_23224186.redacted_raster.pdf",
|
||||
"time_s": 0.3458268642425537,
|
||||
"pii_count": 0
|
||||
},
|
||||
{
|
||||
"pdf": "005_simple_compte_rendu_CRH_23155836.pdf",
|
||||
"time_s": 0.8738148212432861,
|
||||
"pii_count": 140
|
||||
},
|
||||
{
|
||||
"pdf": "008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pdf",
|
||||
"time_s": 0.4308145046234131,
|
||||
"pii_count": 93
|
||||
},
|
||||
{
|
||||
"pdf": "009_simple_compte_rendu_CRO_23051225.pdf",
|
||||
"time_s": 0.47577404975891113,
|
||||
"pii_count": 36
|
||||
},
|
||||
{
|
||||
"pdf": "010_simple_anapath_ANAPATH_23217289.pdf",
|
||||
"time_s": 0.39705705642700195,
|
||||
"pii_count": 54
|
||||
},
|
||||
{
|
||||
"pdf": "011_moyen_compte_rendu_CRH_23080179.pdf",
|
||||
"time_s": 1.0042967796325684,
|
||||
"pii_count": 46
|
||||
},
|
||||
{
|
||||
"pdf": "012_moyen_compte_rendu_CRH_692_23200418.pdf",
|
||||
"time_s": 0.8403730392456055,
|
||||
"pii_count": 103
|
||||
},
|
||||
{
|
||||
"pdf": "013_moyen_compte_rendu_363_23085243_CRO.pdf",
|
||||
"time_s": 0.94016432762146,
|
||||
"pii_count": 160
|
||||
},
|
||||
{
|
||||
"pdf": "014_moyen_compte_rendu_CRO_23167029.redacted_raster.pdf",
|
||||
"time_s": 0.4384956359863281,
|
||||
"pii_count": 0
|
||||
},
|
||||
{
|
||||
"pdf": "015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pdf",
|
||||
"time_s": 0.9846677780151367,
|
||||
"pii_count": 25
|
||||
},
|
||||
{
|
||||
"pdf": "016_moyen_compte_rendu_CRH_23149905.pdf",
|
||||
"time_s": 1.4508278369903564,
|
||||
"pii_count": 242
|
||||
},
|
||||
{
|
||||
"pdf": "017_moyen_compte_rendu_CRO_23222062.redacted_raster.pdf",
|
||||
"time_s": 0.4350569248199463,
|
||||
"pii_count": 0
|
||||
},
|
||||
{
|
||||
"pdf": "018_moyen_compte_rendu_CRH_23042753.pdf",
|
||||
"time_s": 1.9062294960021973,
|
||||
"pii_count": 233
|
||||
},
|
||||
{
|
||||
"pdf": "019_moyen_compte_rendu_CRO_332_23049003.pdf",
|
||||
"time_s": 1.020752191543579,
|
||||
"pii_count": 161
|
||||
},
|
||||
{
|
||||
"pdf": "020_moyen_compte_rendu_CRO_23084754.redacted_raster.pdf",
|
||||
"time_s": 0.4804375171661377,
|
||||
"pii_count": 0
|
||||
},
|
||||
{
|
||||
"pdf": "021_moyen_compte_rendu_CRO_23201117.redacted_raster.pdf",
|
||||
"time_s": 0.31412649154663086,
|
||||
"pii_count": 0
|
||||
},
|
||||
{
|
||||
"pdf": "022_moyen_compte_rendu_cro2_516_23187028.pdf",
|
||||
"time_s": 0.37198877334594727,
|
||||
"pii_count": 29
|
||||
},
|
||||
{
|
||||
"pdf": "023_complexe_compte_rendu_CRH_23102610.pdf",
|
||||
"time_s": 4.054161310195923,
|
||||
"pii_count": 617
|
||||
},
|
||||
{
|
||||
"pdf": "024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pdf",
|
||||
"time_s": 8.550535917282104,
|
||||
"pii_count": 804
|
||||
},
|
||||
{
|
||||
"pdf": "025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pdf",
|
||||
"time_s": 17.83988666534424,
|
||||
"pii_count": 1622
|
||||
},
|
||||
{
|
||||
"pdf": "026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pdf",
|
||||
"time_s": 12.040966749191284,
|
||||
"pii_count": 1056
|
||||
},
|
||||
{
|
||||
"pdf": "027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pdf",
|
||||
"time_s": 8.782238721847534,
|
||||
"pii_count": 859
|
||||
}
|
||||
]
|
||||
}
|
||||
324
tests/ground_truth/pdfs/baseline_anonymized/batch_results.json
Normal file
324
tests/ground_truth/pdfs/baseline_anonymized/batch_results.json
Normal file
@@ -0,0 +1,324 @@
|
||||
{
|
||||
"date": "2026-03-02T10:29:28.280047",
|
||||
"total_documents": 27,
|
||||
"success_count": 25,
|
||||
"total_pii": 6395,
|
||||
"total_time_s": 65.55555844306946,
|
||||
"avg_time_s": 2.4279836460396096,
|
||||
"use_ner": true,
|
||||
"use_vlm": false,
|
||||
"results": [
|
||||
{
|
||||
"pdf": "001_simple_unknown_BACTERIO_23018396.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.38307929039001465,
|
||||
"pii_count": 43,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/001_simple_unknown_BACTERIO_23018396.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "002_simple_unknown_bacterio_476_23159413.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.7698535919189453,
|
||||
"pii_count": 47,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/002_simple_unknown_bacterio_476_23159413.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "003_simple_compte_rendu_CRO_23155084.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.41591382026672363,
|
||||
"pii_count": 25,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/003_simple_compte_rendu_CRO_23155084.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "004_simple_anapath_anapath_53_23224186.redacted_raster.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.3458268642425537,
|
||||
"pii_count": 0,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/004_simple_anapath_anapath_53_23224186.redacted_raster.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "005_simple_compte_rendu_CRH_23155836.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.8738148212432861,
|
||||
"pii_count": 140,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/005_simple_compte_rendu_CRH_23155836.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "006_simple_anapath_ANAPATH_23142660.pdf",
|
||||
"success": false,
|
||||
"time_s": 0.0017476081848144531,
|
||||
"error": ""
|
||||
},
|
||||
{
|
||||
"pdf": "007_simple_anapath_ANAPATH_23096332.pdf",
|
||||
"success": false,
|
||||
"time_s": 0.0013265609741210938,
|
||||
"error": ""
|
||||
},
|
||||
{
|
||||
"pdf": "008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.4308145046234131,
|
||||
"pii_count": 93,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/008_simple_trackare_trackare-14004105-23202435_14004105_23202435.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "009_simple_compte_rendu_CRO_23051225.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.47577404975891113,
|
||||
"pii_count": 36,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/009_simple_compte_rendu_CRO_23051225.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "010_simple_anapath_ANAPATH_23217289.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.39705705642700195,
|
||||
"pii_count": 54,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/010_simple_anapath_ANAPATH_23217289.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "011_moyen_compte_rendu_CRH_23080179.pdf",
|
||||
"success": true,
|
||||
"time_s": 1.0042967796325684,
|
||||
"pii_count": 46,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/011_moyen_compte_rendu_CRH_23080179.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "012_moyen_compte_rendu_CRH_692_23200418.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.8403730392456055,
|
||||
"pii_count": 103,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/012_moyen_compte_rendu_CRH_692_23200418.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "013_moyen_compte_rendu_363_23085243_CRO.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.94016432762146,
|
||||
"pii_count": 160,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/013_moyen_compte_rendu_363_23085243_CRO.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "014_moyen_compte_rendu_CRO_23167029.redacted_raster.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.4384956359863281,
|
||||
"pii_count": 0,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/014_moyen_compte_rendu_CRO_23167029.redacted_raster.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.9846677780151367,
|
||||
"pii_count": 25,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/015_moyen_unknown_CONSULTATION_ANESTHESISTE_23139653.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "016_moyen_compte_rendu_CRH_23149905.pdf",
|
||||
"success": true,
|
||||
"time_s": 1.4508278369903564,
|
||||
"pii_count": 242,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/016_moyen_compte_rendu_CRH_23149905.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "017_moyen_compte_rendu_CRO_23222062.redacted_raster.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.4350569248199463,
|
||||
"pii_count": 0,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/017_moyen_compte_rendu_CRO_23222062.redacted_raster.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "018_moyen_compte_rendu_CRH_23042753.pdf",
|
||||
"success": true,
|
||||
"time_s": 1.9062294960021973,
|
||||
"pii_count": 233,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/018_moyen_compte_rendu_CRH_23042753.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "019_moyen_compte_rendu_CRO_332_23049003.pdf",
|
||||
"success": true,
|
||||
"time_s": 1.020752191543579,
|
||||
"pii_count": 161,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/019_moyen_compte_rendu_CRO_332_23049003.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "020_moyen_compte_rendu_CRO_23084754.redacted_raster.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.4804375171661377,
|
||||
"pii_count": 0,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/020_moyen_compte_rendu_CRO_23084754.redacted_raster.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "021_moyen_compte_rendu_CRO_23201117.redacted_raster.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.31412649154663086,
|
||||
"pii_count": 0,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/021_moyen_compte_rendu_CRO_23201117.redacted_raster.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "022_moyen_compte_rendu_cro2_516_23187028.pdf",
|
||||
"success": true,
|
||||
"time_s": 0.37198877334594727,
|
||||
"pii_count": 29,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/022_moyen_compte_rendu_cro2_516_23187028.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "023_complexe_compte_rendu_CRH_23102610.pdf",
|
||||
"success": true,
|
||||
"time_s": 4.054161310195923,
|
||||
"pii_count": 617,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/023_complexe_compte_rendu_CRH_23102610.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pdf",
|
||||
"success": true,
|
||||
"time_s": 8.550535917282104,
|
||||
"pii_count": 804,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/024_complexe_trackare_trackare-17001141-23066188_17001141_23066188.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pdf",
|
||||
"success": true,
|
||||
"time_s": 17.83988666534424,
|
||||
"pii_count": 1622,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/025_complexe_trackare_trackare-02016820-23095226_02016820_23095226.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pdf",
|
||||
"success": true,
|
||||
"time_s": 12.040966749191284,
|
||||
"pii_count": 1056,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/026_complexe_trackare_trackare-15000536-23074384_15000536_23074384.redacted_raster.pdf"
|
||||
}
|
||||
},
|
||||
{
|
||||
"pdf": "027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pdf",
|
||||
"success": true,
|
||||
"time_s": 8.782238721847534,
|
||||
"pii_count": 859,
|
||||
"files": {
|
||||
"text": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.pseudonymise.txt",
|
||||
"audit": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.audit.jsonl",
|
||||
"pdf_vector": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.redacted_vector.pdf",
|
||||
"pdf_raster": "tests/ground_truth/pdfs/baseline_anonymized/027_complexe_trackare_trackare-10027557-23183041_10027557_23183041.redacted_raster.pdf"
|
||||
}
|
||||
}
|
||||
]
|
||||
}
|
||||
Reference in New Issue
Block a user