{"_id": {"$oid": "69d4eb12b877594bc5718c8a"}, "test_id": "T0678", "benchmark": "company_lists", "date": "2026-03-16", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "genai", "model": "gemini-3.1-flash-lite-preview", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt_min.txt", "legacy_test": false}, "prompt": "- Answer in valid JSON.\n- The page ID is given as {page_id}.\n", "results": {"text": "{\"page_id\":\"9\",\"entries\":[{\"entry_id\":\"1\",\"company_name\":\"Crowe & Co., Ltd.\",\"location\":\"Basle\"},{\"entry_id\":\"2\",\"company_name\":\"Imperial Airways Ltd.\",\"location\":\"Croydon\"},{\"entry_id\":\"3\",\"company_name\":\"Metallwerke A.G.\",\"location\":\"Dornach (Solothurn)\"},{\"entry_id\":\"4\",\"company_name\":\"Aluminium-Industrie-Aktien-Gesellschaft\",\"location\":\"Neuhausen\"},{\"entry_id\":\"5\",\"company_name\":\"Chemische Fabrik vorm. Sandoz\",\"location\":\"Basle\"},{\"entry_id\":\"6\",\"company_name\":\"Clayton Aniline Co., Ltd.\",\"location\":\"Manchester\"},{\"entry_id\":\"7\",\"company_name\":\"J. R. Geigy, A.-G.\",\"location\":\"Basle\"},{\"entry_id\":\"8\",\"company_name\":\"Society of Chemical Industry in Basle\",\"location\":\"Basle\"},{\"entry_id\":\"9\",\"company_name\":\"J. Hopf & Co.\",\"location\":\"Basle\"},{\"entry_id\":\"10\",\"company_name\":\"Rayon A.-G.\",\"location\":\"Arlesheim\"},{\"entry_id\":\"11\",\"company_name\":\"Banque F\u00e9d\u00e9rale S. A.\",\"location\":\"Vevey\"},{\"entry_id\":\"12\",\"company_name\":\"Barclays Bank Ltd.\",\"location\":\"London\"},{\"entry_id\":\"13\",\"company_name\":\"Galland & Co.\",\"location\":\"Lausanne\"},{\"entry_id\":\"14\",\"company_name\":\"Lloyds and National Provincial Foreign Bank, Ltd.\",\"location\":\"Geneva\"},{\"entry_id\":\"15\",\"company_name\":\"Swiss Bank Corporation\",\"location\":\"Basle\"},{\"entry_id\":\"16\",\"company_name\":\"Swiss Bank Corporation\",\"location\":\"Lausanne\"},{\"entry_id\":\"17\",\"company_name\":\"Wagons-Lits/Cook S. A.\",\"location\":\"Geneva\"}]}", "model": "gemini-3.1-flash-lite-preview", "provider": "genai", "finish_reason": "STOP", "usage": {"input_tokens": 1107, "output_tokens": 724, "total_tokens": 1831, "input_cost_usd": 0.00027675, "output_cost_usd": 0.0010860000000000002, "estimated_cost_usd": 0.0013627500000000002}, "duration": 7.913965940475464, "timestamp": "2026-03-16T19:09:59.538654", "parsed": {"page_id": "9", "entries": [{"entry_id": "1", "company_name": "Crowe & Co., Ltd.", "location": "Basle"}, {"entry_id": "2", "company_name": "Imperial Airways Ltd.", "location": "Croydon"}, {"entry_id": "3", "company_name": "Metallwerke A.G.", "location": "Dornach (Solothurn)"}, {"entry_id": "4", "company_name": "Aluminium-Industrie-Aktien-Gesellschaft", "location": "Neuhausen"}, {"entry_id": "5", "company_name": "Chemische Fabrik vorm. Sandoz", "location": "Basle"}, {"entry_id": "6", "company_name": "Clayton Aniline Co., Ltd.", "location": "Manchester"}, {"entry_id": "7", "company_name": "J. R. Geigy, A.-G.", "location": "Basle"}, {"entry_id": "8", "company_name": "Society of Chemical Industry in Basle", "location": "Basle"}, {"entry_id": "9", "company_name": "J. Hopf & Co.", "location": "Basle"}, {"entry_id": "10", "company_name": "Rayon A.-G.", "location": "Arlesheim"}, {"entry_id": "11", "company_name": "Banque F\u00e9d\u00e9rale S. A.", "location": "Vevey"}, {"entry_id": "12", "company_name": "Barclays Bank Ltd.", "location": "London"}, {"entry_id": "13", "company_name": "Galland & Co.", "location": "Lausanne"}, {"entry_id": "14", "company_name": "Lloyds and National Provincial Foreign Bank, Ltd.", "location": "Geneva"}, {"entry_id": "15", "company_name": "Swiss Bank Corporation", "location": "Basle"}, {"entry_id": "16", "company_name": "Swiss Bank Corporation", "location": "Lausanne"}, {"entry_id": "17", "company_name": "Wagons-Lits/Cook S. A.", "location": "Geneva"}]}, "conversation_id": "cfc9048d-dca1-44f2-81fe-5a07540f145b", "score": {"f1_score": 0.58, "precision": 0.5769230769230769, "recall": 0.5769230769230769, "true_positives": 30, "false_positives": 22, "false_negatives": 22, "field_scores": {"entries[2].location": {"response": "Dornach (Solothurn)", "ground_truth": "Dornach (Solothurn)", "score": 1.0}, "entries[1].entry_id": {"response": "2", "ground_truth": "156089_1321093_11-2", "score": 0.09999999999999998}, "entries[1].company_name": {"response": "Imperial Airways Ltd.", "ground_truth": "Imperial Airways Ltd.", "score": 1.0}, "entries[15].company_name": {"response": "Swiss Bank Corporation", "ground_truth": "Swiss Bank Corporation", "score": 1.0}, "entries[14].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[0].entry_id": {"response": "1", "ground_truth": "156089_1321093_11-1", "score": 0.09999999999999998}, "entries[10].company_name": {"response": "Banque F\u00e9d\u00e9rale S. A.", "ground_truth": "Banque F\u00e9d\u00e9rale S.A.", "score": 0.975609756097561}, "page_id": {"response": "9", "ground_truth": "156089_1321093_11", "score": 0.11111111111111116}, "entries[2].entry_id": {"response": "3", "ground_truth": "156089_1321093_11-3", "score": 0.09999999999999998}, "entries[14].company_name": {"response": "Swiss Bank Corporation", "ground_truth": "Swiss Bank Corporation", "score": 1.0}, "entries[12].entry_id": {"response": "13", "ground_truth": "156089_1321093_11-13", "score": 0.18181818181818177}, "entries[7].entry_id": {"response": "8", "ground_truth": "156089_1321093_11-8", "score": 0.09999999999999998}, "entries[5].entry_id": {"response": "6", "ground_truth": "156089_1321093_11-6", "score": 0.09999999999999998}, "entries[7].company_name": {"response": "Society of Chemical Industry in Basle", "ground_truth": "Society of Chemical Industry in Basle", "score": 1.0}, "entries[16].location": {"response": "Geneva", "ground_truth": "Geneva", "score": 1.0}, "entries[13].entry_id": {"response": "14", "ground_truth": "156089_1321093_11-14", "score": 0.18181818181818177}, "entries[9].location": {"response": "Arlesheim", "ground_truth": "Arlesheim", "score": 1.0}, "entries[0].company_name": {"response": "Crowe & Co., Ltd.", "ground_truth": "Crowe & Co., Ltd.", "score": 1.0}, "entries[5].company_name": {"response": "Clayton Aniline Co., Ltd.", "ground_truth": "Clayton Aniline Co., Ltd.", "score": 1.0}, "entries[16].company_name": {"response": "Wagons-Lits/Cook S. A.", "ground_truth": "Wagons-Lits/Cook S.A.", "score": 0.9767441860465115}, "entries[11].location": {"response": "London", "ground_truth": "London E.C. 3.", "score": 0.6}, "entries[2].company_name": {"response": "Metallwerke A.G.", "ground_truth": "Metallwerke A.G.", "score": 1.0}, "entries[11].entry_id": {"response": "12", "ground_truth": "156089_1321093_11-12", "score": 0.18181818181818177}, "entries[6].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[8].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[4].entry_id": {"response": "5", "ground_truth": "156089_1321093_11-5", "score": 0.09999999999999998}, "entries[11].company_name": {"response": "Barclays Bank Ltd.", "ground_truth": "Barclays Bank Ltd. (Foreign Branch)", "score": 0.679245283018868}, "entries[3].company_name": {"response": "Aluminium-Industrie-Aktien-Gesellschaft", "ground_truth": "Aluminium-Industrie-Aktien-Gesellschaft", "score": 1.0}, "entries[3].location": {"response": "Neuhausen", "ground_truth": "Neuhausen", "score": 1.0}, "entries[4].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[4].company_name": {"response": "Chemische Fabrik vorm. Sandoz", "ground_truth": "Chemische Fabrik vorm. Sandoz", "score": 1.0}, "entries[0].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[9].company_name": {"response": "Rayon A.-G.", "ground_truth": "Rayon A.-G. (Merchants)", "score": 0.6470588235294117}, "entries[3].entry_id": {"response": "4", "ground_truth": "156089_1321093_11-4", "score": 0.09999999999999998}, "entries[8].entry_id": {"response": "9", "ground_truth": "156089_1321093_11-9", "score": 0.09999999999999998}, "entries[10].location": {"response": "Vevey", "ground_truth": "Vevey", "score": 1.0}, "entries[9].entry_id": {"response": "10", "ground_truth": "156089_1321093_11-10", "score": 0.18181818181818177}, "entries[1].location": {"response": "Croydon", "ground_truth": "Croydon", "score": 1.0}, "entries[13].company_name": {"response": "Lloyds and National Provincial Foreign Bank, Ltd.", "ground_truth": "Lloyds and National Provincial Foreign Bank, Ltd.", "score": 1.0}, "entries[12].company_name": {"response": "Galland & Co.", "ground_truth": "Galland & Co.", "score": 1.0}, "entries[6].entry_id": {"response": "7", "ground_truth": "156089_1321093_11-7", "score": 0.09999999999999998}, "entries[10].entry_id": {"response": "11", "ground_truth": "156089_1321093_11-11", "score": 0.18181818181818177}, "entries[15].entry_id": {"response": "16", "ground_truth": "156089_1321093_11-16", "score": 0.18181818181818177}, "entries[13].location": {"response": "Geneva", "ground_truth": "Geneva", "score": 1.0}, "entries[16].entry_id": {"response": "17", "ground_truth": "156089_1321093_11-17", "score": 0.18181818181818177}, "entries[8].company_name": {"response": "J. Hopf & Co.", "ground_truth": "J. Hopf & Co. (Merchants)", "score": 0.6842105263157895}, "entries[12].location": {"response": "Lausanne", "ground_truth": "Lausanne", "score": 1.0}, "entries[5].location": {"response": "Manchester", "ground_truth": "Manchester", "score": 1.0}, "entries[15].location": {"response": "Lausanne", "ground_truth": "Lausanne", "score": 1.0}, "entries[14].entry_id": {"response": "15", "ground_truth": "156089_1321093_11-15", "score": 0.18181818181818177}, "entries[7].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[6].company_name": {"response": "J. R. Geigy, A.-G.", "ground_truth": "J. R. Geigy, A.-G.", "score": 1.0}}, "total_fields": 52}, "raw_response": "{\"sdk_http_response\":{\"headers\":{\"content-type\":\"application/json; charset=UTF-8\",\"vary\":\"Origin, X-Origin, Referer\",\"content-encoding\":\"gzip\",\"date\":\"Mon, 16 Mar 2026 18:10:06 GMT\",\"server\":\"scaffolding on HTTPServer2\",\"x-xss-protection\":\"0\",\"x-frame-options\":\"SAMEORIGIN\",\"x-content-type-options\":\"nosniff\",\"server-timing\":\"gfet4t7; dur=7604\",\"alt-svc\":\"h3=\\\":443\\\"; ma=2592000,h3-29=\\\":443\\\"; ma=2592000\",\"transfer-encoding\":\"chunked\"},\"body\":null},\"candidates\":[{\"content\":{\"parts\":[{\"media_resolution\":null,\"code_execution_result\":null,\"executable_code\":null,\"file_data\":null,\"function_call\":null,\"function_response\":null,\"inline_data\":null,\"text\":\"{\\n  \\\"page_id\\\": \\\"9\\\",\\n  \\\"entries\\\": [\\n    {\\n      \\\"entry_id\\\": \\\"1\\\",\\n      \\\"company_name\\\": \\\"Crowe & Co., Ltd.\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"2\\\",\\n      \\\"company_name\\\": \\\"Imperial Airways Ltd.\\\",\\n      \\\"location\\\": \\\"Croydon\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"3\\\",\\n      \\\"company_name\\\": \\\"Metallwerke A.G.\\\",\\n      \\\"location\\\": \\\"Dornach (Solothurn)\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"4\\\",\\n      \\\"company_name\\\": \\\"Aluminium-Industrie-Aktien-Gesellschaft\\\",\\n      \\\"location\\\": \\\"Neuhausen\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"5\\\",\\n      \\\"company_name\\\": \\\"Chemische Fabrik vorm. Sandoz\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"6\\\",\\n      \\\"company_name\\\": \\\"Clayton Aniline Co., Ltd.\\\",\\n      \\\"location\\\": \\\"Manchester\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"7\\\",\\n      \\\"company_name\\\": \\\"J. R. Geigy, A.-G.\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"8\\\",\\n      \\\"company_name\\\": \\\"Society of Chemical Industry in Basle\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"9\\\",\\n      \\\"company_name\\\": \\\"J. Hopf & Co.\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"10\\\",\\n      \\\"company_name\\\": \\\"Rayon A.-G.\\\",\\n      \\\"location\\\": \\\"Arlesheim\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"11\\\",\\n      \\\"company_name\\\": \\\"Banque F\u00e9d\u00e9rale S. A.\\\",\\n      \\\"location\\\": \\\"Vevey\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"12\\\",\\n      \\\"company_name\\\": \\\"Barclays Bank Ltd.\\\",\\n      \\\"location\\\": \\\"London\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"13\\\",\\n      \\\"company_name\\\": \\\"Galland & Co.\\\",\\n      \\\"location\\\": \\\"Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"14\\\",\\n      \\\"company_name\\\": \\\"Lloyds and National Provincial Foreign Bank, Ltd.\\\",\\n      \\\"location\\\": \\\"Geneva\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"15\\\",\\n      \\\"company_name\\\": \\\"Swiss Bank Corporation\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"16\\\",\\n      \\\"company_name\\\": \\\"Swiss Bank Corporation\\\",\\n      \\\"location\\\": \\\"Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"17\\\",\\n      \\\"company_name\\\": \\\"Wagons-Lits/Cook S. A.\\\",\\n      \\\"location\\\": \\\"Geneva\\\"\\n    }\\n  ]\\n}\",\"thought\":null,\"thought_signature\":\"EjQKMgG-Pvb7KMrgOtlwOS1uMhe1A24n-NEZSMtgDw9dekPzi8SveBDxIjk9kHEoa02CO6Ag\",\"video_metadata\":null}],\"role\":\"model\"},\"citation_metadata\":null,\"finish_message\":null,\"token_count\":null,\"finish_reason\":\"STOP\",\"avg_logprobs\":null,\"grounding_metadata\":null,\"index\":0,\"logprobs_result\":null,\"safety_ratings\":null,\"url_context_metadata\":null}],\"create_time\":null,\"model_version\":\"gemini-3.1-flash-lite-preview\",\"prompt_feedback\":null,\"response_id\":\"fke4aaHyEqHusAKfteKBDQ\",\"usage_metadata\":{\"cache_tokens_details\":null,\"cached_content_token_count\":null,\"candidates_token_count\":724,\"candidates_tokens_details\":null,\"prompt_token_count\":1107,\"prompt_tokens_details\":[{\"modality\":\"TEXT\",\"token_count\":27},{\"modality\":\"IMAGE\",\"token_count\":1080}],\"thoughts_token_count\":null,\"tool_use_prompt_token_count\":null,\"tool_use_prompt_tokens_details\":null,\"total_token_count\":1831,\"traffic_type\":null},\"automatic_function_calling_history\":[],\"parsed\":{\"page_id\":\"9\",\"entries\":[{\"entry_id\":\"1\",\"company_name\":\"Crowe & Co., Ltd.\",\"location\":\"Basle\"},{\"entry_id\":\"2\",\"company_name\":\"Imperial Airways Ltd.\",\"location\":\"Croydon\"},{\"entry_id\":\"3\",\"company_name\":\"Metallwerke A.G.\",\"location\":\"Dornach (Solothurn)\"},{\"entry_id\":\"4\",\"company_name\":\"Aluminium-Industrie-Aktien-Gesellschaft\",\"location\":\"Neuhausen\"},{\"entry_id\":\"5\",\"company_name\":\"Chemische Fabrik vorm. Sandoz\",\"location\":\"Basle\"},{\"entry_id\":\"6\",\"company_name\":\"Clayton Aniline Co., Ltd.\",\"location\":\"Manchester\"},{\"entry_id\":\"7\",\"company_name\":\"J. R. Geigy, A.-G.\",\"location\":\"Basle\"},{\"entry_id\":\"8\",\"company_name\":\"Society of Chemical Industry in Basle\",\"location\":\"Basle\"},{\"entry_id\":\"9\",\"company_name\":\"J. Hopf & Co.\",\"location\":\"Basle\"},{\"entry_id\":\"10\",\"company_name\":\"Rayon A.-G.\",\"location\":\"Arlesheim\"},{\"entry_id\":\"11\",\"company_name\":\"Banque F\u00e9d\u00e9rale S. A.\",\"location\":\"Vevey\"},{\"entry_id\":\"12\",\"company_name\":\"Barclays Bank Ltd.\",\"location\":\"London\"},{\"entry_id\":\"13\",\"company_name\":\"Galland & Co.\",\"location\":\"Lausanne\"},{\"entry_id\":\"14\",\"company_name\":\"Lloyds and National Provincial Foreign Bank, Ltd.\",\"location\":\"Geneva\"},{\"entry_id\":\"15\",\"company_name\":\"Swiss Bank Corporation\",\"location\":\"Basle\"},{\"entry_id\":\"16\",\"company_name\":\"Swiss Bank Corporation\",\"location\":\"Lausanne\"},{\"entry_id\":\"17\",\"company_name\":\"Wagons-Lits/Cook S. A.\",\"location\":\"Geneva\"}]}}"}, "scoring": {"f1_micro": 0.44059153493115755, "f1_macro": 0.42, "micro_precision": 0.4458204334365325, "micro_recall": 0.43548387096774194, "total_instances": 15, "total_tp": 432, "total_fp": 537, "total_fn": 560, "cost_summary": {"total_input_tokens": 16723, "total_output_tokens": 14504, "total_tokens": 31227, "input_cost_usd": 0.00418075, "output_cost_usd": 0.021755999999999998, "total_cost_usd": 0.02593675}}, "normalized_score": 42.0}