{"_id": {"$oid": "6a2c86a59ede3a3eff37d49a"}, "test_id": "T1084", "benchmark": "company_lists", "date": "2026-06-04", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "anthropic", "model": "claude-opus-4-8", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt.txt", "legacy_test": false}, "prompt": "The image you are presented with stems from a digitized book containing lists of companies.\nYour task is to extract structured information about each company listed on the page.\n\nAbout the source:\n- The image stems from a trade index of the British Swiss Chamber of Commerce.\n- The image can show an alphabetical or a thematic list of companies.\n- The companies are mostly located in Switzerland and the UK.\n- The image stems from a trade index between 1925 and 1958.\n- Most pages have one column but some years have two columns.\n- The source itself is in English and German but the company names can be in English, German, French or Italian.\n\nAbout the entries:\n- Each entry describes a single company or person.\n- Alphabetical entries have filling dots between the company name and the page number. Dots and page numbers are not part of the data and should be ignored.\n- Alphabetical entries seldom to never have locations.\n- Thematic entries often have locations.\n- Thematic entries are listed under headings that describe the type of business.\n- Some thematic headings are only references to other headings, e.g. \"X, s. Y\".\n\nAbout the output:\n- Answer in valid JSON. The JSON should be an array of objects with the following fields:\n- The page ID is given as {page_id}.\n- Do not add country information, if it is not directly written with the location.\n\n{\n  \"entry_id\": \"A unique identifier for the entry, e.g. '{page_id}-1'\",\n  \"company_name\": \"The name of the company or person\",\n  \"location\": \"The location of the company, e.g. 'Zurich' or 'London, UK'. If no location is given, set to null.\"\n  ]\n}\n", "results": {"text": "{\"page_id\":\"89\",\"entries\":[{\"entry_id\":\"89-1\",\"company_name\":\"C. Troeber-Ruesch (agent for textile machinery)\",\"location\":\"K\u00fcsnacht (Zurich)\"},{\"entry_id\":\"89-2\",\"company_name\":\"Unitraco Ltd. (Importers)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-3\",\"company_name\":\"H. Ursprung (Importer and Exporter)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-4\",\"company_name\":\"Wettler & Frey (Machinery for contractors, including shovels, cranes, crushing and screening)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-5\",\"company_name\":\"Paul W\u00fcthrich\",\"location\":\"Lausanne\"},{\"entry_id\":\"89-6\",\"company_name\":\"Hultons Press Ltd. (Periodicals and Magazines)\",\"location\":\"London E.C.4\"},{\"entry_id\":\"89-7\",\"company_name\":\"George Fischer Ltd.\",\"location\":\"Schaffhausen\"},{\"entry_id\":\"89-8\",\"company_name\":\"Louis Martin (Importer and agent for Inboard and Outboard Motors)\",\"location\":\"Lausanne\"},{\"entry_id\":\"89-9\",\"company_name\":\"Techag Ltd.\",\"location\":\"Zurich\"},{\"entry_id\":\"89-10\",\"company_name\":\"Usine Fega\",\"location\":\"Zurich\"},{\"entry_id\":\"89-11\",\"company_name\":\"R. Amiguet-Peter (importer)\",\"location\":\"Lausanne\"}]}", "model": "claude-opus-4-8", "provider": "anthropic", "finish_reason": "tool_use", "usage": {"input_tokens": 4979, "output_tokens": 601, "total_tokens": 5580, "input_cost_usd": 0.024895, "output_cost_usd": 0.015025, "estimated_cost_usd": 0.03992}, "duration": 8.016093730926514, "timestamp": "2026-06-04T11:32:19.919940", "parsed": {"page_id": "89", "entries": [{"entry_id": "89-1", "company_name": "C. Troeber-Ruesch (agent for textile machinery)", "location": "K\u00fcsnacht (Zurich)"}, {"entry_id": "89-2", "company_name": "Unitraco Ltd. (Importers)", "location": "Zurich"}, {"entry_id": "89-3", "company_name": "H. Ursprung (Importer and Exporter)", "location": "Zurich"}, {"entry_id": "89-4", "company_name": "Wettler & Frey (Machinery for contractors, including shovels, cranes, crushing and screening)", "location": "Zurich"}, {"entry_id": "89-5", "company_name": "Paul W\u00fcthrich", "location": "Lausanne"}, {"entry_id": "89-6", "company_name": "Hultons Press Ltd. (Periodicals and Magazines)", "location": "London E.C.4"}, {"entry_id": "89-7", "company_name": "George Fischer Ltd.", "location": "Schaffhausen"}, {"entry_id": "89-8", "company_name": "Louis Martin (Importer and agent for Inboard and Outboard Motors)", "location": "Lausanne"}, {"entry_id": "89-9", "company_name": "Techag Ltd.", "location": "Zurich"}, {"entry_id": "89-10", "company_name": "Usine Fega", "location": "Zurich"}, {"entry_id": "89-11", "company_name": "R. Amiguet-Peter (importer)", "location": "Lausanne"}]}, "conversation_id": "4cd77c9a-94d1-4abc-8921-980c405ea2e3", "score": {"f1_score": 0.41, "precision": 0.4117647058823529, "recall": 0.4117647058823529, "true_positives": 14, "false_positives": 20, "false_negatives": 20, "field_scores": {"entries[1].location": {"response": "Zurich", "ground_truth": "Zurich", "score": 1.0}, "entries[0].company_name": {"response": "C. Troeber-Ruesch (agent for textile machinery)", "ground_truth": "C. Troeber-Ruesch", "score": 0.53125}, "entries[8].company_name": {"response": "Techag Ltd.", "ground_truth": "Techag Ltd.", "score": 1.0}, "entries[8].entry_id": {"response": "89-9", "ground_truth": "156089_1321097_125-9", "score": 0.33333333333333337}, "entries[10].location": {"response": "Lausanne", "ground_truth": "Lausanne", "score": 1.0}, "entries[2].location": {"response": "Zurich", "ground_truth": "Zurich", "score": 1.0}, "entries[3].entry_id": {"response": "89-4", "ground_truth": "156089_1321097_125-4", "score": 0.33333333333333337}, "page_id": {"response": "89", "ground_truth": "156089_1321097_125", "score": 0.19999999999999996}, "entries[4].location": {"response": "Lausanne", "ground_truth": "Lausanne", "score": 1.0}, "entries[2].entry_id": {"response": "89-3", "ground_truth": "156089_1321097_125-3", "score": 0.33333333333333337}, "entries[3].location": {"response": "Zurich", "ground_truth": "Zurich 6", "score": 0.8571428571428572}, "entries[5].entry_id": {"response": "89-6", "ground_truth": "156089_1321097_125-6", "score": 0.33333333333333337}, "entries[3].company_name": {"response": "Wettler & Frey (Machinery for contractors, including shovels, cranes, crushing and screening)", "ground_truth": "Wettler & Frey", "score": 0.26168224299065423}, "entries[1].entry_id": {"response": "89-2", "ground_truth": "156089_1321097_125-2", "score": 0.33333333333333337}, "entries[6].location": {"response": "Schaffhausen", "ground_truth": "Schaffhausen", "score": 1.0}, "entries[0].location": {"response": "K\u00fcsnacht (Zurich)", "ground_truth": "K\u00fcsnacht (Zurich)", "score": 1.0}, "entries[4].company_name": {"response": "Paul W\u00fcthrich", "ground_truth": "Paul W\u00fcthrich", "score": 1.0}, "entries[5].location": {"response": "London E.C.4", "ground_truth": "London E. C. 4", "score": 0.923076923076923}, "entries[0].entry_id": {"response": "89-1", "ground_truth": "156089_1321097_125-1", "score": 0.33333333333333337}, "entries[9].entry_id": {"response": "89-10", "ground_truth": "156089_1321097_125-10", "score": 0.3846153846153846}, "entries[6].entry_id": {"response": "89-7", "ground_truth": "156089_1321097_125-7", "score": 0.33333333333333337}, "entries[9].company_name": {"response": "Usine Fega", "ground_truth": "Usine Fega", "score": 1.0}, "entries[6].company_name": {"response": "George Fischer Ltd.", "ground_truth": "George Fischer Ltd.", "score": 1.0}, "entries[1].company_name": {"response": "Unitraco Ltd. (Importers)", "ground_truth": "Unitraco Ltd.", "score": 0.6842105263157895}, "entries[5].company_name": {"response": "Hultons Press Ltd. (Periodicals and Magazines)", "ground_truth": "Hultons Press Ltd.", "score": 0.5625}, "entries[7].company_name": {"response": "Louis Martin (Importer and agent for Inboard and Outboard Motors)", "ground_truth": "Louis Martin", "score": 0.3116883116883117}, "entries[7].location": {"response": "Lausanne", "ground_truth": "Lausanne", "score": 1.0}, "entries[2].company_name": {"response": "H. Ursprung (Importer and Exporter)", "ground_truth": "H. Ursprung", "score": 0.4782608695652174}, "entries[4].entry_id": {"response": "89-5", "ground_truth": "156089_1321097_125-5", "score": 0.33333333333333337}, "entries[8].location": {"response": "Zurich", "ground_truth": "Zurich", "score": 1.0}, "entries[10].company_name": {"response": "R. Amiguet-Peter (importer)", "ground_truth": "R. Amiguet-Peter", "score": 0.7441860465116279}, "entries[7].entry_id": {"response": "89-8", "ground_truth": "156089_1321097_125-8", "score": 0.33333333333333337}, "entries[9].location": {"response": "Zurich", "ground_truth": "Zurich", "score": 1.0}, "entries[10].entry_id": {"response": "89-11", "ground_truth": "156089_1321097_125-11", "score": 0.3846153846153846}}, "total_fields": 34}, "raw_response": "{\"id\":\"msg_01QUy34sNbFb2eHjh53V7eGu\",\"container\":null,\"content\":[{\"id\":\"toolu_01F8mWLM6ftxuhT9SFZccfb1\",\"caller\":{\"type\":\"direct\"},\"input\":{\"page_id\":\"89\",\"entries\":[{\"entry_id\":\"89-1\",\"company_name\":\"C. Troeber-Ruesch (agent for textile machinery)\",\"location\":\"K\u00fcsnacht (Zurich)\"},{\"entry_id\":\"89-2\",\"company_name\":\"Unitraco Ltd. (Importers)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-3\",\"company_name\":\"H. Ursprung (Importer and Exporter)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-4\",\"company_name\":\"Wettler & Frey (Machinery for contractors, including shovels, cranes, crushing and screening)\",\"location\":\"Zurich\"},{\"entry_id\":\"89-5\",\"company_name\":\"Paul W\u00fcthrich\",\"location\":\"Lausanne\"},{\"entry_id\":\"89-6\",\"company_name\":\"Hultons Press Ltd. (Periodicals and Magazines)\",\"location\":\"London E.C.4\"},{\"entry_id\":\"89-7\",\"company_name\":\"George Fischer Ltd.\",\"location\":\"Schaffhausen\"},{\"entry_id\":\"89-8\",\"company_name\":\"Louis Martin (Importer and agent for Inboard and Outboard Motors)\",\"location\":\"Lausanne\"},{\"entry_id\":\"89-9\",\"company_name\":\"Techag Ltd.\",\"location\":\"Zurich\"},{\"entry_id\":\"89-10\",\"company_name\":\"Usine Fega\",\"location\":\"Zurich\"},{\"entry_id\":\"89-11\",\"company_name\":\"R. Amiguet-Peter (importer)\",\"location\":\"Lausanne\"}]},\"name\":\"extract_structured_data\",\"type\":\"tool_use\"}],\"model\":\"claude-opus-4-8\",\"role\":\"assistant\",\"stop_reason\":\"tool_use\",\"stop_sequence\":null,\"type\":\"message\",\"usage\":{\"cache_creation\":{\"ephemeral_1h_input_tokens\":0,\"ephemeral_5m_input_tokens\":0},\"cache_creation_input_tokens\":0,\"cache_read_input_tokens\":0,\"inference_geo\":\"global\",\"input_tokens\":4979,\"output_tokens\":601,\"server_tool_use\":null,\"service_tier\":\"standard\",\"output_tokens_details\":{\"thinking_tokens\":0}},\"stop_details\":null}"}, "scoring": {"f1_micro": 0.4260474507824331, "f1_macro": 0.4266666666666667, "micro_precision": 0.42669362992922144, "micro_recall": 0.4254032258064516, "total_instances": 15, "total_tp": 422, "total_fp": 567, "total_fn": 570, "cost_summary": {"total_input_tokens": 72983, "total_output_tokens": 18269, "total_tokens": 91252, "input_cost_usd": 0.36491500000000004, "output_cost_usd": 0.456725, "total_cost_usd": 0.8216399999999999}}, "normalized_score": 42.66666666666667}