{"_id": {"$oid": "69d4eb12b877594bc5718a0f"}, "test_id": "T0386", "benchmark": "company_lists", "date": "2025-10-28", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "mistral", "model": "mistral-medium-2505", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt_min.txt", "legacy_test": false}, "prompt": "- Answer in valid JSON.\n- The page ID is given as {page_id}.\n", "results": {"provider": "mistral", "model": "mistral-medium-2505", "duration": 8.428334474563599, "timestamp": "2025-10-28T09:43:28.113658", "parsed": {"page_id": "16", "entries": [{"entry_id": "1", "company_name": "F\u00e4rbereien Schetty, A.-G.", "location": "Basle"}, {"entry_id": "2", "company_name": "G. Kappeler A.-G.", "location": "Zofingen"}, {"entry_id": "3", "company_name": "J. A. Crabtree & Co., Ltd.", "location": "Walsall, England"}, {"entry_id": "4", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "5", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "6", "company_name": "Magn\u00e9tos Lucifer S.A.", "location": "Carouge-Gen\u00e8ve"}, {"entry_id": "7", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "8", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "9", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "10", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "11", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}, {"entry_id": "12", "company_name": "Brown Boveri & Cie, A.-G.", "location": "Baden (Switzerland)"}]}, "text": "", "raw_response": {"id": "ceafdf0b133a4fba89c0c96f8c0e1407", "model": "mistral-medium-2505", "choices": [{"finish_reason": "stop", "index": 0, "message": {"content": "{\n  \"page_id\": \"16\",\n  \"entries\": [\n    {\n      \"entry_id\": \"1\",\n      \"company_name\": \"F\u00e4rbereien Schetty, A.-G.\",\n      \"location\": \"Basle\"\n    },\n    {\n      \"entry_id\": \"2\",\n      \"company_name\": \"G. Kappeler A.-G.\",\n      \"location\": \"Zofingen\"\n    },\n    {\n      \"entry_id\": \"3\",\n      \"company_name\": \"J. A. Crabtree & Co., Ltd.\",\n      \"location\": \"Walsall, England\"\n    },\n    {\n      \"entry_id\": \"4\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"5\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"6\",\n      \"company_name\": \"Magn\u00e9tos Lucifer S.A.\",\n      \"location\": \"Carouge-Gen\u00e8ve\"\n    },\n    {\n      \"entry_id\": \"7\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"8\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"9\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"10\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"11\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    },\n    {\n      \"entry_id\": \"12\",\n      \"company_name\": \"Brown Boveri & Cie, A.-G.\",\n      \"location\": \"Baden (Switzerland)\"\n    }\n  ]\n}", "role": "assistant"}}], "usage": {"prompt_tokens": 1154, "completion_tokens": 492, "total_tokens": 1646}}, "usage": {"input_tokens": 1154, "output_tokens": 492, "total_tokens": 1646}, "finish_reason": "stop"}, "scoring": {"f1_micro": 0.36032171581769434, "f1_macro": 0.3893333333333333, "micro_precision": 0.3848797250859107, "micro_recall": 0.3387096774193548, "total_instances": 15, "total_tp": 336, "total_fp": 537, "total_fn": 656, "cost_summary": {"total_input_tokens": 16156, "total_output_tokens": 11769, "total_tokens": 27925, "input_cost_usd": 0.006462, "output_cost_usd": 0.023538, "total_cost_usd": 0.03, "pricing_date": "2025-10-28", "input_price_per_million": 0.4, "output_price_per_million": 2.0}}, "normalized_score": 38.93333333333333}