{"_id": {"$oid": "69d4eb12b877594bc5718a23"}, "test_id": "T0352", "benchmark": "company_lists", "date": "2025-10-28", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "openai", "model": "gpt-5-nano", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt_min.txt", "legacy_test": false}, "prompt": "- Answer in valid JSON.\n- The page ID is given as {page_id}.\n", "results": {"provider": "openai", "model": "gpt-5-nano", "duration": 24.08856964111328, "timestamp": "2025-10-28T10:31:40.374117", "parsed": {"page_id": "{page_id}", "entries": [{"entry_id": "E1", "company_name": "Adolphe Saurer S.A.", "location": "Arbon"}, {"entry_id": "E2", "company_name": "The North British Rubber Co (Continental) Ltd.", "location": "Zurich"}, {"entry_id": "E3", "company_name": "Church Street Manufacturing Co., Ltd.", "location": "Great Harwood"}, {"entry_id": "E4", "company_name": "Thomas Adams, Ltd.", "location": "Nottingham"}, {"entry_id": "E5", "company_name": "Brown Boveri & Cie., A.-G.", "location": "Baden, Switzerland"}, {"entry_id": "E6", "company_name": "Nova Knitting Works, Siegrist & Co.", "location": "Oftringen"}, {"entry_id": "E7", "company_name": "Bigar Fr\u00e8res (Grands Magasins Innovation S.A.)", "location": "Lausanne"}, {"entry_id": "E8", "company_name": "Bonnard & Cie., S.A.", "location": "Lausanne"}, {"entry_id": "E9", "company_name": "Fr. Sauter A.-G.", "location": "Basle"}, {"entry_id": "E10", "company_name": "John Layton & Co., Ltd.", "location": "Zurich"}, {"entry_id": "E11", "company_name": "Cunard Steam Ship Co., Ltd.", "location": "Lucerne"}]}, "text": "", "raw_response": {"id": "chatcmpl-CVaKtz2uGvU4OSe40aTN2qdtHfT1Q", "model": "gpt-5-nano-2025-08-07", "choices": [{"finish_reason": "stop", "index": 0, "message": {"content": "{\"page_id\":\"{page_id}\",\"entries\":[{\"entry_id\":\"E1\",\"company_name\":\"Adolphe Saurer S.A.\",\"location\":\"Arbon\"},{\"entry_id\":\"E2\",\"company_name\":\"The North British Rubber Co (Continental) Ltd.\",\"location\":\"Zurich\"},{\"entry_id\":\"E3\",\"company_name\":\"Church Street Manufacturing Co., Ltd.\",\"location\":\"Great Harwood\"},{\"entry_id\":\"E4\",\"company_name\":\"Thomas Adams, Ltd.\",\"location\":\"Nottingham\"},{\"entry_id\":\"E5\",\"company_name\":\"Brown Boveri & Cie., A.-G.\",\"location\":\"Baden, Switzerland\"},{\"entry_id\":\"E6\",\"company_name\":\"Nova Knitting Works, Siegrist & Co.\",\"location\":\"Oftringen\"},{\"entry_id\":\"E7\",\"company_name\":\"Bigar Fr\u00e8res (Grands Magasins Innovation S.A.)\",\"location\":\"Lausanne\"},{\"entry_id\":\"E8\",\"company_name\":\"Bonnard & Cie., S.A.\",\"location\":\"Lausanne\"},{\"entry_id\":\"E9\",\"company_name\":\"Fr. Sauter A.-G.\",\"location\":\"Basle\"},{\"entry_id\":\"E10\",\"company_name\":\"John Layton & Co., Ltd.\",\"location\":\"Zurich\"},{\"entry_id\":\"E11\",\"company_name\":\"Cunard Steam Ship Co., Ltd.\",\"location\":\"Lucerne\"}]}", "role": "assistant"}}], "usage": {"prompt_tokens": 1202, "completion_tokens": 2851, "total_tokens": 4053}}, "usage": {"input_tokens": 1202, "output_tokens": 2851, "total_tokens": 4053}, "finish_reason": "stop"}, "scoring": {"f1_micro": 0.27167630057803466, "f1_macro": 0.2613333333333333, "micro_precision": 0.31842818428184283, "micro_recall": 0.2368951612903226, "total_instances": 15, "total_tp": 235, "total_fp": 503, "total_fn": 757, "cost_summary": {"total_input_tokens": 18030, "total_output_tokens": 66338, "total_tokens": 84368, "input_cost_usd": 0.000902, "output_cost_usd": 0.026535, "total_cost_usd": 0.027437, "pricing_date": "2025-10-28", "input_price_per_million": 0.05, "output_price_per_million": 0.4}}, "normalized_score": 26.13333333333333}