{"_id": {"$oid": "6a26c67c3572c06bc1455d0c"}, "test_id": "T0795", "benchmark": "magazine_pages", "date": "2026-03-23", "tags": {"century": [20], "document-type": ["newspaper-page"], "language": ["en"], "layout": ["prose", "columns"], "script": ["latin"], "task": ["document-understanding"], "writing": ["printed"]}, "contributors": ["lea_kasper", "sorin_marti", "arno_bosse"], "hidden": false, "config": {"provider": "mistral", "model": "magistral-medium-2509", "dataclass": "MagazinePage", "temperature": 0.0, "role_description": "You are a historian with expertise in analyzing and summarizing historical magazine pages", "prompt_file": "prompt.txt", "legacy_test": false}, "prompt": "Extract all advertisements and return their bounding boxes.\nThe original size of the page is {width} x {height} pixels.", "results": {"text": "{\"advertisements\":[{\"box\":[162.0,189.0,492.0,348.0]},{\"box\":[162.0,408.0,492.0,567.0]},{\"box\":[162.0,627.0,492.0,786.0]},{\"box\":[162.0,846.0,492.0,1005.0]},{\"box\":[162.0,1065.0,492.0,1224.0]},{\"box\":[162.0,1284.0,492.0,1443.0]},{\"box\":[162.0,1503.0,492.0,1662.0]},{\"box\":[162.0,1722.0,492.0,1881.0]},{\"box\":[162.0,1941.0,492.0,2100.0]},{\"box\":[162.0,2160.0,492.0,2319.0]},{\"box\":[162.0,2379.0,492.0,2538.0]},{\"box\":[162.0,2598.0,492.0,2757.0]},{\"box\":[162.0,2817.0,492.0,2976.0]},{\"box\":[162.0,3036.0,492.0,3195.0]},{\"box\":[162.0,3255.0,492.0,3414.0]},{\"box\":[552.0,189.0,882.0,348.0]},{\"box\":[552.0,408.0,882.0,567.0]},{\"box\":[552.0,627.0,882.0,786.0]},{\"box\":[552.0,846.0,882.0,1005.0]},{\"box\":[552.0,1065.0,882.0,1224.0]},{\"box\":[552.0,1284.0,882.0,1443.0]},{\"box\":[552.0,1503.0,882.0,1662.0]},{\"box\":[552.0,1722.0,882.0,1881.0]},{\"box\":[552.0,1941.0,882.0,2100.0]},{\"box\":[552.0,2160.0,882.0,2319.0]},{\"box\":[552.0,2379.0,882.0,2538.0]},{\"box\":[552.0,2598.0,882.0,2757.0]},{\"box\":[552.0,2817.0,882.0,2976.0]},{\"box\":[552.0,3036.0,882.0,3195.0]},{\"box\":[552.0,3255.0,882.0,3414.0]},{\"box\":[942.0,189.0,1272.0,348.0]},{\"box\":[942.0,408.0,1272.0,567.0]},{\"box\":[942.0,627.0,1272.0,786.0]},{\"box\":[942.0,846.0,1272.0,1005.0]},{\"box\":[942.0,1065.0,1272.0,1224.0]},{\"box\":[942.0,1284.0,1272.0,1443.0]},{\"box\":[942.0,1503.0,1272.0,1662.0]},{\"box\":[942.0,1722.0,1272.0,1881.0]},{\"box\":[942.0,1941.0,1272.0,2100.0]},{\"box\":[942.0,2160.0,1272.0,2319.0]},{\"box\":[942.0,2379.0,1272.0,2538.0]},{\"box\":[942.0,2598.0,1272.0,2757.0]},{\"box\":[942.0,2817.0,1272.0,2976.0]},{\"box\":[942.0,3036.0,1272.0,3195.0]},{\"box\":[942.0,3255.0,1272.0,3414.0]},{\"box\":[1332.0,189.0,1662.0,348.0]},{\"box\":[1332.0,408.0,1662.0,567.0]},{\"box\":[1332.0,627.0,1662.0,786.0]},{\"box\":[1332.0,846.0,1662.0,1005.0]},{\"box\":[1332.0,1065.0,1662.0,1224.0]},{\"box\":[1332.0,1284.0,1662.0,1443.0]},{\"box\":[1332.0,1503.0,1662.0,1662.0]},{\"box\":[1332.0,1722.0,1662.0,1881.0]},{\"box\":[1332.0,1941.0,1662.0,2100.0]},{\"box\":[1332.0,2160.0,1662.0,2319.0]},{\"box\":[1332.0,2379.0,1662.0,2538.0]},{\"box\":[1332.0,2598.0,1662.0,2757.0]},{\"box\":[1332.0,2817.0,1662.0,2976.0]},{\"box\":[1332.0,3036.0,1662.0,3195.0]},{\"box\":[1332.0,3255.0,1662.0,3414.0]},{\"box\":[1722.0,189.0,2052.0,348.0]},{\"box\":[1722.0,408.0,2052.0,567.0]},{\"box\":[1722.0,627.0,2052.0,786.0]},{\"box\":[1722.0,846.0,2052.0,1005.0]},{\"box\":[1722.0,1065.0,2052.0,1224.0]},{\"box\":[1722.0,1284.0,2052.0,1443.0]},{\"box\":[1722.0,1503.0,2052.0,1662.0]},{\"box\":[1722.0,1722.0,2052.0,1881.0]},{\"box\":[1722.0,1941.0,2052.0,2100.0]},{\"box\":[1722.0,2160.0,2052.0,2319.0]},{\"box\":[1722.0,2379.0,2052.0,2538.0]},{\"box\":[1722.0,2598.0,2052.0,2757.0]},{\"box\":[1722.0,2817.0,2052.0,2976.0]},{\"box\":[1722.0,3036.0,2052.0,3195.0]},{\"box\":[1722.0,3255.0,2052.0,3414.0]},{\"box\":[2112.0,189.0,2442.0,348.0]},{\"box\":[2112.0,408.0,2442.0,567.0]},{\"box\":[2112.0,627.0,2442.0,786.0]},{\"box\":[2112.0,846.0,2442.0,1005.0]},{\"box\":[2112.0,1065.0,2442.0,1224.0]},{\"box\":[2112.0,1284.0,2442.0,1443.0]},{\"box\":[2112.0,1503.0,2442.0,1662.0]},{\"box\":[2112.0,1722.0,2442.0,1881.0]},{\"box\":[2112.0,1941.0,2442.0,2100.0]},{\"box\":[2112.0,2160.0,2442.0,2319.0]},{\"box\":[2112.0,2379.0,2442.0,2538.0]},{\"box\":[2112.0,2598.0,2442.0,2757.0]},{\"box\":[2112.0,2817.0,2442.0,2976.0]},{\"box\":[2112.0,3036.0,2442.0,3195.0]},{\"box\":[2112.0,3255.0,2442.0,3414.0]}]}", "model": "magistral-medium-2509", "provider": "mistral", "finish_reason": "stop", "usage": {"input_tokens": 254, "output_tokens": 2322, "total_tokens": 2576, "input_cost_usd": 0.000508, "output_cost_usd": 0.011609999999999999, "estimated_cost_usd": 0.012117999999999999}, "duration": 32.11439847946167, "timestamp": "2026-03-23T22:42:55.979513", "parsed": {"advertisements": [{"box": [162, 189, 492, 348]}, {"box": [162, 408, 492, 567]}, {"box": [162, 627, 492, 786]}, {"box": [162, 846, 492, 1005]}, {"box": [162, 1065, 492, 1224]}, {"box": [162, 1284, 492, 1443]}, {"box": [162, 1503, 492, 1662]}, {"box": [162, 1722, 492, 1881]}, {"box": [162, 1941, 492, 2100]}, {"box": [162, 2160, 492, 2319]}, {"box": [162, 2379, 492, 2538]}, {"box": [162, 2598, 492, 2757]}, {"box": [162, 2817, 492, 2976]}, {"box": [162, 3036, 492, 3195]}, {"box": [162, 3255, 492, 3414]}, {"box": [552, 189, 882, 348]}, {"box": [552, 408, 882, 567]}, {"box": [552, 627, 882, 786]}, {"box": [552, 846, 882, 1005]}, {"box": [552, 1065, 882, 1224]}, {"box": [552, 1284, 882, 1443]}, {"box": [552, 1503, 882, 1662]}, {"box": [552, 1722, 882, 1881]}, {"box": [552, 1941, 882, 2100]}, {"box": [552, 2160, 882, 2319]}, {"box": [552, 2379, 882, 2538]}, {"box": [552, 2598, 882, 2757]}, {"box": [552, 2817, 882, 2976]}, {"box": [552, 3036, 882, 3195]}, {"box": [552, 3255, 882, 3414]}, {"box": [942, 189, 1272, 348]}, {"box": [942, 408, 1272, 567]}, {"box": [942, 627, 1272, 786]}, {"box": [942, 846, 1272, 1005]}, {"box": [942, 1065, 1272, 1224]}, {"box": [942, 1284, 1272, 1443]}, {"box": [942, 1503, 1272, 1662]}, {"box": [942, 1722, 1272, 1881]}, {"box": [942, 1941, 1272, 2100]}, {"box": [942, 2160, 1272, 2319]}, {"box": [942, 2379, 1272, 2538]}, {"box": [942, 2598, 1272, 2757]}, {"box": [942, 2817, 1272, 2976]}, {"box": [942, 3036, 1272, 3195]}, {"box": [942, 3255, 1272, 3414]}, {"box": [1332, 189, 1662, 348]}, {"box": [1332, 408, 1662, 567]}, {"box": [1332, 627, 1662, 786]}, {"box": [1332, 846, 1662, 1005]}, {"box": [1332, 1065, 1662, 1224]}, {"box": [1332, 1284, 1662, 1443]}, {"box": [1332, 1503, 1662, 1662]}, {"box": [1332, 1722, 1662, 1881]}, {"box": [1332, 1941, 1662, 2100]}, {"box": [1332, 2160, 1662, 2319]}, {"box": [1332, 2379, 1662, 2538]}, {"box": [1332, 2598, 1662, 2757]}, {"box": [1332, 2817, 1662, 2976]}, {"box": [1332, 3036, 1662, 3195]}, {"box": [1332, 3255, 1662, 3414]}, {"box": [1722, 189, 2052, 348]}, {"box": [1722, 408, 2052, 567]}, {"box": [1722, 627, 2052, 786]}, {"box": [1722, 846, 2052, 1005]}, {"box": [1722, 1065, 2052, 1224]}, {"box": [1722, 1284, 2052, 1443]}, {"box": [1722, 1503, 2052, 1662]}, {"box": [1722, 1722, 2052, 1881]}, {"box": [1722, 1941, 2052, 2100]}, {"box": [1722, 2160, 2052, 2319]}, {"box": [1722, 2379, 2052, 2538]}, {"box": [1722, 2598, 2052, 2757]}, {"box": [1722, 2817, 2052, 2976]}, {"box": [1722, 3036, 2052, 3195]}, {"box": [1722, 3255, 2052, 3414]}, {"box": [2112, 189, 2442, 348]}, {"box": [2112, 408, 2442, 567]}, {"box": [2112, 627, 2442, 786]}, {"box": [2112, 846, 2442, 1005]}, {"box": [2112, 1065, 2442, 1224]}, {"box": [2112, 1284, 2442, 1443]}, {"box": [2112, 1503, 2442, 1662]}, {"box": [2112, 1722, 2442, 1881]}, {"box": [2112, 1941, 2442, 2100]}, {"box": [2112, 2160, 2442, 2319]}, {"box": [2112, 2379, 2442, 2538]}, {"box": [2112, 2598, 2442, 2757]}, {"box": [2112, 2817, 2442, 2976]}, {"box": [2112, 3036, 2442, 3195]}, {"box": [2112, 3255, 2442, 3414]}]}, "conversation_id": "a30dd686-64e3-4707-aaa7-4871a3e8595c", "score": {"f1": 0.0, "precision": 0.0, "recall": 0.0, "mean_iou": 0.0, "true_positives": 0, "false_positives": 90, "false_negatives": 2, "iou_threshold": 0.5}, "raw_response": "{\"id\":\"09cb086a291f4145812c3ab2b9e70b33\",\"object\":\"chat.completion\",\"model\":\"magistral-medium-2509\",\"usage\":{\"prompt_tokens\":254,\"completion_tokens\":2322,\"total_tokens\":2576,\"prompt_tokens_details\":{\"cached_tokens\":233}},\"created\":1774302145,\"choices\":[{\"index\":0,\"message\":{\"role\":\"assistant\",\"content\":\"{\\\"advertisements\\\": [{\\\"box\\\": [162, 189, 492, 348]}, {\\\"box\\\": [162, 408, 492, 567]}, {\\\"box\\\": [162, 627, 492, 786]}, {\\\"box\\\": [162, 846, 492, 1005]}, {\\\"box\\\": [162, 1065, 492, 1224]}, {\\\"box\\\": [162, 1284, 492, 1443]}, {\\\"box\\\": [162, 1503, 492, 1662]}, {\\\"box\\\": [162, 1722, 492, 1881]}, {\\\"box\\\": [162, 1941, 492, 2100]}, {\\\"box\\\": [162, 2160, 492, 2319]}, {\\\"box\\\": [162, 2379, 492, 2538]}, {\\\"box\\\": [162, 2598, 492, 2757]}, {\\\"box\\\": [162, 2817, 492, 2976]}, {\\\"box\\\": [162, 3036, 492, 3195]}, {\\\"box\\\": [162, 3255, 492, 3414]}, {\\\"box\\\": [552, 189, 882, 348]}, {\\\"box\\\": [552, 408, 882, 567]}, {\\\"box\\\": [552, 627, 882, 786]}, {\\\"box\\\": [552, 846, 882, 1005]}, {\\\"box\\\": [552, 1065, 882, 1224]}, {\\\"box\\\": [552, 1284, 882, 1443]}, {\\\"box\\\": [552, 1503, 882, 1662]}, {\\\"box\\\": [552, 1722, 882, 1881]}, {\\\"box\\\": [552, 1941, 882, 2100]}, {\\\"box\\\": [552, 2160, 882, 2319]}, {\\\"box\\\": [552, 2379, 882, 2538]}, {\\\"box\\\": [552, 2598, 882, 2757]}, {\\\"box\\\": [552, 2817, 882, 2976]}, {\\\"box\\\": [552, 3036, 882, 3195]}, {\\\"box\\\": [552, 3255, 882, 3414]}, {\\\"box\\\": [942, 189, 1272, 348]}, {\\\"box\\\": [942, 408, 1272, 567]}, {\\\"box\\\": [942, 627, 1272, 786]}, {\\\"box\\\": [942, 846, 1272, 1005]}, {\\\"box\\\": [942, 1065, 1272, 1224]}, {\\\"box\\\": [942, 1284, 1272, 1443]}, {\\\"box\\\": [942, 1503, 1272, 1662]}, {\\\"box\\\": [942, 1722, 1272, 1881]}, {\\\"box\\\": [942, 1941, 1272, 2100]}, {\\\"box\\\": [942, 2160, 1272, 2319]}, {\\\"box\\\": [942, 2379, 1272, 2538]}, {\\\"box\\\": [942, 2598, 1272, 2757]}, {\\\"box\\\": [942, 2817, 1272, 2976]}, {\\\"box\\\": [942, 3036, 1272, 3195]}, {\\\"box\\\": [942, 3255, 1272, 3414]}, {\\\"box\\\": [1332, 189, 1662, 348]}, {\\\"box\\\": [1332, 408, 1662, 567]}, {\\\"box\\\": [1332, 627, 1662, 786]}, {\\\"box\\\": [1332, 846, 1662, 1005]}, {\\\"box\\\": [1332, 1065, 1662, 1224]}, {\\\"box\\\": [1332, 1284, 1662, 1443]}, {\\\"box\\\": [1332, 1503, 1662, 1662]}, {\\\"box\\\": [1332, 1722, 1662, 1881]}, {\\\"box\\\": [1332, 1941, 1662, 2100]}, {\\\"box\\\": [1332, 2160, 1662, 2319]}, {\\\"box\\\": [1332, 2379, 1662, 2538]}, {\\\"box\\\": [1332, 2598, 1662, 2757]}, {\\\"box\\\": [1332, 2817, 1662, 2976]}, {\\\"box\\\": [1332, 3036, 1662, 3195]}, {\\\"box\\\": [1332, 3255, 1662, 3414]}, {\\\"box\\\": [1722, 189, 2052, 348]}, {\\\"box\\\": [1722, 408, 2052, 567]}, {\\\"box\\\": [1722, 627, 2052, 786]}, {\\\"box\\\": [1722, 846, 2052, 1005]}, {\\\"box\\\": [1722, 1065, 2052, 1224]}, {\\\"box\\\": [1722, 1284, 2052, 1443]}, {\\\"box\\\": [1722, 1503, 2052, 1662]}, {\\\"box\\\": [1722, 1722, 2052, 1881]}, {\\\"box\\\": [1722, 1941, 2052, 2100]}, {\\\"box\\\": [1722, 2160, 2052, 2319]}, {\\\"box\\\": [1722, 2379, 2052, 2538]}, {\\\"box\\\": [1722, 2598, 2052, 2757]}, {\\\"box\\\": [1722, 2817, 2052, 2976]}, {\\\"box\\\": [1722, 3036, 2052, 3195]}, {\\\"box\\\": [1722, 3255, 2052, 3414]}, {\\\"box\\\": [2112, 189, 2442, 348]}, {\\\"box\\\": [2112, 408, 2442, 567]}, {\\\"box\\\": [2112, 627, 2442, 786]}, {\\\"box\\\": [2112, 846, 2442, 1005]}, {\\\"box\\\": [2112, 1065, 2442, 1224]}, {\\\"box\\\": [2112, 1284, 2442, 1443]}, {\\\"box\\\": [2112, 1503, 2442, 1662]}, {\\\"box\\\": [2112, 1722, 2442, 1881]}, {\\\"box\\\": [2112, 1941, 2442, 2100]}, {\\\"box\\\": [2112, 2160, 2442, 2319]}, {\\\"box\\\": [2112, 2379, 2442, 2538]}, {\\\"box\\\": [2112, 2598, 2442, 2757]}, {\\\"box\\\": [2112, 2817, 2442, 2976]}, {\\\"box\\\": [2112, 3036, 2442, 3195]}, {\\\"box\\\": [2112, 3255, 2442, 3414]}]}\",\"tool_calls\":null,\"prefix\":false},\"finish_reason\":\"stop\"}]}"}, "scoring": {"f1": 0.0, "precision": 0.0, "recall": 0.0, "mean_iou": 0.0, "true_positives": 0, "false_positives": 1842, "false_negatives": 126, "num_pages": 46, "cost_summary": {"total_input_tokens": 5080, "total_output_tokens": 47515, "total_tokens": 52595, "input_cost_usd": 0.010159999999999997, "output_cost_usd": 0.23757500000000004, "total_cost_usd": 0.24773499999999993}}, "normalized_score": 0}