{"_id": {"$oid": "69d4eb12b877594bc5718a0d"}, "test_id": "T0346", "benchmark": "company_lists", "date": "2025-10-28", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "openai", "model": "gpt-4.1-nano", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt_min.txt", "legacy_test": false}, "prompt": "- Answer in valid JSON.\n- The page ID is given as {page_id}.\n", "results": {"provider": "openai", "model": "gpt-4.1-nano", "duration": 2.499525547027588, "timestamp": "2025-10-28T09:49:39.968203", "parsed": {"page_id": "{page_id}", "entries": [{"entry_id": "1", "company_name": "Hultons Press Ltd.", "location": "London"}, {"entry_id": "2", "company_name": "George Fischer Ltd.", "location": "Schaffhausen"}, {"entry_id": "3", "company_name": "Louis Martin", "location": "Lausanne"}, {"entry_id": "4", "company_name": "Techag Ltd.", "location": "Zurich"}, {"entry_id": "5", "company_name": "Usine Fega", "location": "Zurich"}, {"entry_id": "6", "company_name": "R. Amiguet-Peter", "location": "Lausanne"}]}, "text": "", "raw_response": {"id": "chatcmpl-CVZgZW1SXZ624NkJp0ifRMyuiR3JS", "model": "gpt-4.1-nano-2025-04-14", "choices": [{"finish_reason": "stop", "index": 0, "message": {"content": "{\"page_id\":\"{page_id}\",\"entries\":[{\"entry_id\":\"1\",\"company_name\":\"Hultons Press Ltd.\",\"location\":\"London\"},{\"entry_id\":\"2\",\"company_name\":\"George Fischer Ltd.\",\"location\":\"Schaffhausen\"},{\"entry_id\":\"3\",\"company_name\":\"Louis Martin\",\"location\":\"Lausanne\"},{\"entry_id\":\"4\",\"company_name\":\"Techag Ltd.\",\"location\":\"Zurich\"},{\"entry_id\":\"5\",\"company_name\":\"Usine Fega\",\"location\":\"Zurich\"},{\"entry_id\":\"6\",\"company_name\":\"R. Amiguet-Peter\",\"location\":\"Lausanne\"}]}", "role": "assistant"}}], "usage": {"prompt_tokens": 1962, "completion_tokens": 123, "total_tokens": 2085}}, "usage": {"input_tokens": 1962, "output_tokens": 123, "total_tokens": 2085}, "finish_reason": "stop"}, "scoring": {"f1_micro": 0.3530037214247741, "f1_macro": 0.30066666666666664, "micro_precision": 0.3734533183352081, "micro_recall": 0.3346774193548387, "total_instances": 15, "total_tp": 332, "total_fp": 557, "total_fn": 660, "cost_summary": {"total_input_tokens": 28248, "total_output_tokens": 7158, "total_tokens": 35406, "input_cost_usd": 0.002825, "output_cost_usd": 0.002863, "total_cost_usd": 0.005688, "pricing_date": "2025-10-28", "input_price_per_million": 0.1, "output_price_per_million": 0.4}}, "normalized_score": 30.066666666666663}