{"_id": {"$oid": "69d4eb12b877594bc5718d6f"}, "test_id": "T0836", "benchmark": "company_lists", "date": "2026-03-25", "tags": {"document-type": ["book-page"], "writing": ["printed"], "century": [20], "language": ["en", "de"], "layout": ["list"], "entry-type": ["company"], "task": ["information-extraction"]}, "contributors": ["lea_kasper", "sorin_marti"], "hidden": false, "config": {"provider": "alibaba", "model": "qwen3.5-35b-a3b", "dataclass": "ListPage", "temperature": 0.5, "role_description": "You are a Historian", "prompt_file": "prompt_min.txt", "rules": "{\"base_url\": \"https://ws-wkjpbv6ov7sqlgqe.ap-southeast-1.maas.aliyuncs.com/compatible-mode/v1\"}", "legacy_test": false}, "prompt": "- Answer in valid JSON.\n- The page ID is given as {page_id}.\n", "results": {"text": "{\"page_id\":\"28\",\"entries\":[{\"entry_id\":\"1\",\"company_name\":\"Hermann Thorens\",\"location\":\"Ste. Croix\"},{\"entry_id\":\"2\",\"company_name\":\"\\\"Simex\\\" Soc. Coop.\",\"location\":\"3, Place St. Fran\u00e7ois, Lausanne\"},{\"entry_id\":\"3\",\"company_name\":\"Fabrique d'Automobiles \\\"Berna\\\" S. A.\",\"location\":\"Olten\"},{\"entry_id\":\"4\",\"company_name\":\"Emil Birkh\u00e4user & Co.\",\"location\":\"11, Elisabethenstrasse, Basle\"},{\"entry_id\":\"5\",\"company_name\":\"Imprimerie de l'Ere Nouvelle\",\"location\":\"12, Rue de la Louve, Lausanne\"},{\"entry_id\":\"6\",\"company_name\":\"Kreis & Co.\",\"location\":\"21, Petersgraben, Basle\"},{\"entry_id\":\"7\",\"company_name\":\"S\u00e4uberlin & Pfeiffer S. A.\",\"location\":\"Vevey\"},{\"entry_id\":\"8\",\"company_name\":\"Fr. Schenkel-Wyss\",\"location\":\"60, Huttenstrasse, Zurich\"},{\"entry_id\":\"9\",\"company_name\":\"Lovell & Christmas, Ltd.\",\"location\":\"West Smithfield, London, E. C. 1.\"},{\"entry_id\":\"10\",\"company_name\":\"E. Osswald (Wholesale)\",\"location\":\"16, Kreuzplatz, Zurich\"},{\"entry_id\":\"11\",\"company_name\":\"Winandy & Co.\",\"location\":\"16, Rue de Bourg, Lausanne\"},{\"entry_id\":\"12\",\"company_name\":\"Pro Lemanio\",\"location\":\"Grand Ch\u00eane, Lausanne\"},{\"entry_id\":\"13\",\"company_name\":\"Th. Roussy, \\\"Librairie Anglaise\\\"\",\"location\":\"3, Rue de Bourg, Lausanne\"},{\"entry_id\":\"14\",\"company_name\":\"Schindler & Co.\",\"location\":\"Lucerne\"},{\"entry_id\":\"15\",\"company_name\":\"Sulzer Fr\u00e8res S. A.\",\"location\":\"Winterthur\"},{\"entry_id\":\"16\",\"company_name\":\"Basle Warehouse Co., Ltd.\",\"location\":\"1, Erlenstrasse, Basle\"},{\"entry_id\":\"17\",\"company_name\":\"Canadian Pacific Railway Co.\",\"location\":\"62-65, Charing Cross, London S. W. 1.\"},{\"entry_id\":\"18\",\"company_name\":\"Crowe & Co., Ltd.\",\"location\":\"67, Nauenstrasse, Basle\"},{\"entry_id\":\"19\",\"company_name\":\"Danzas & Co., A. G.\",\"location\":\"Basle\"},{\"entry_id\":\"20\",\"company_name\":\"Dominion Express Company of Canada\",\"location\":\"62\u201365, Charing Cross, London S. W. 1.\"},{\"entry_id\":\"21\",\"company_name\":\"Galland & Co.\",\"location\":\"3, Place St. Fran\u00e7ois, Lausanne\"},{\"entry_id\":\"22\",\"company_name\":\"Goth & Co. (General Agents of the Canadian Pacific Railway Co. and of the Dominion Express Co. of Canada)\",\"location\":\"45, Elisabethenstrasse, Basle\"},{\"entry_id\":\"23\",\"company_name\":\"Charles ImObersteg & Co.\",\"location\":\"30, Aeschengraben, Basle\"}]}", "model": "qwen3.5-35b-a3b", "provider": "alibaba", "finish_reason": "stop", "usage": {"input_tokens": 2715, "output_tokens": 1084, "total_tokens": 3799, "input_cost_usd": 0.00067875, "output_cost_usd": 0.002168, "estimated_cost_usd": 0.00284675}, "duration": 14.776832580566406, "timestamp": "2026-03-25T10:17:23.770229", "parsed": {"page_id": "28", "entries": [{"entry_id": "1", "company_name": "Hermann Thorens", "location": "Ste. Croix"}, {"entry_id": "2", "company_name": "\"Simex\" Soc. Coop.", "location": "3, Place St. Fran\u00e7ois, Lausanne"}, {"entry_id": "3", "company_name": "Fabrique d'Automobiles \"Berna\" S. A.", "location": "Olten"}, {"entry_id": "4", "company_name": "Emil Birkh\u00e4user & Co.", "location": "11, Elisabethenstrasse, Basle"}, {"entry_id": "5", "company_name": "Imprimerie de l'Ere Nouvelle", "location": "12, Rue de la Louve, Lausanne"}, {"entry_id": "6", "company_name": "Kreis & Co.", "location": "21, Petersgraben, Basle"}, {"entry_id": "7", "company_name": "S\u00e4uberlin & Pfeiffer S. A.", "location": "Vevey"}, {"entry_id": "8", "company_name": "Fr. Schenkel-Wyss", "location": "60, Huttenstrasse, Zurich"}, {"entry_id": "9", "company_name": "Lovell & Christmas, Ltd.", "location": "West Smithfield, London, E. C. 1."}, {"entry_id": "10", "company_name": "E. Osswald (Wholesale)", "location": "16, Kreuzplatz, Zurich"}, {"entry_id": "11", "company_name": "Winandy & Co.", "location": "16, Rue de Bourg, Lausanne"}, {"entry_id": "12", "company_name": "Pro Lemanio", "location": "Grand Ch\u00eane, Lausanne"}, {"entry_id": "13", "company_name": "Th. Roussy, \"Librairie Anglaise\"", "location": "3, Rue de Bourg, Lausanne"}, {"entry_id": "14", "company_name": "Schindler & Co.", "location": "Lucerne"}, {"entry_id": "15", "company_name": "Sulzer Fr\u00e8res S. A.", "location": "Winterthur"}, {"entry_id": "16", "company_name": "Basle Warehouse Co., Ltd.", "location": "1, Erlenstrasse, Basle"}, {"entry_id": "17", "company_name": "Canadian Pacific Railway Co.", "location": "62-65, Charing Cross, London S. W. 1."}, {"entry_id": "18", "company_name": "Crowe & Co., Ltd.", "location": "67, Nauenstrasse, Basle"}, {"entry_id": "19", "company_name": "Danzas & Co., A. G.", "location": "Basle"}, {"entry_id": "20", "company_name": "Dominion Express Company of Canada", "location": "62\u201365, Charing Cross, London S. W. 1."}, {"entry_id": "21", "company_name": "Galland & Co.", "location": "3, Place St. Fran\u00e7ois, Lausanne"}, {"entry_id": "22", "company_name": "Goth & Co. (General Agents of the Canadian Pacific Railway Co. and of the Dominion Express Co. of Canada)", "location": "45, Elisabethenstrasse, Basle"}, {"entry_id": "23", "company_name": "Charles ImObersteg & Co.", "location": "30, Aeschengraben, Basle"}]}, "conversation_id": "73ffdba9-8dcc-4023-8b5d-37b02e12cc0a", "score": {"f1_score": 0.28, "precision": 0.2857142857142857, "recall": 0.273972602739726, "true_positives": 20, "false_positives": 50, "false_negatives": 53, "field_scores": {"entries[15].location": {"response": "1, Erlenstrasse, Basle", "ground_truth": "Winterthur", "score": 0.1875}, "entries[0].entry_id": {"response": "1", "ground_truth": "156089_1321086_40-1", "score": 0.09999999999999998}, "entries[17].entry_id": {"response": "18", "ground_truth": "156089_1321086_40-18", "score": 0.18181818181818177}, "entries[23].entry_id": {"response": "", "ground_truth": "156089_1321086_40-24", "score": 0.0}, "entries[8].entry_id": {"response": "9", "ground_truth": "156089_1321086_40-9", "score": 0.09999999999999998}, "entries[9].company_name": {"response": "E. Osswald (Wholesale)", "ground_truth": "E. Osswald", "score": 0.625}, "entries[2].location": {"response": "Olten", "ground_truth": "Olten", "score": 1.0}, "entries[14].company_name": {"response": "Sulzer Fr\u00e8res S. A.", "ground_truth": "Sulzer Fr\u00e8res S. A.", "score": 1.0}, "entries[16].company_name": {"response": "Canadian Pacific Railway Co.", "ground_truth": "Basle Warehouse Co., Ltd.", "score": 0.26415094339622647}, "entries[16].location": {"response": "62-65, Charing Cross, London S. W. 1.", "ground_truth": "Basle", "score": 0.09523809523809523}, "entries[19].company_name": {"response": "Dominion Express Company of Canada", "ground_truth": "Danzas & Co., A. G.", "score": 0.30188679245283023}, "entries[6].location": {"response": "Vevey", "ground_truth": "Vevey", "score": 1.0}, "entries[10].entry_id": {"response": "11", "ground_truth": "156089_1321086_40-11", "score": 0.18181818181818177}, "entries[11].location": {"response": "Grand Ch\u00eane, Lausanne", "ground_truth": "Lausanne", "score": 0.5517241379310345}, "entries[6].company_name": {"response": "S\u00e4uberlin & Pfeiffer S. A.", "ground_truth": "S\u00e4uberlin & Pfeiffer S. A.", "score": 1.0}, "entries[19].location": {"response": "62\u201365, Charing Cross, London S. W. 1.", "ground_truth": "Basle", "score": 0.09523809523809523}, "entries[1].entry_id": {"response": "2", "ground_truth": "156089_1321086_40-2", "score": 0.09999999999999998}, "entries[3].location": {"response": "11, Elisabethenstrasse, Basle", "ground_truth": "Basle", "score": 0.2941176470588235}, "entries[5].company_name": {"response": "Kreis & Co.", "ground_truth": "Kreis & Co.", "score": 1.0}, "entries[7].location": {"response": "60, Huttenstrasse, Zurich", "ground_truth": "Zurich", "score": 0.3870967741935484}, "entries[15].entry_id": {"response": "16", "ground_truth": "156089_1321086_40-16", "score": 0.18181818181818177}, "entries[16].entry_id": {"response": "17", "ground_truth": "156089_1321086_40-17", "score": 0.18181818181818177}, "entries[22].company_name": {"response": "Charles ImObersteg & Co.", "ground_truth": "Goth & Co.", "score": 0.4117647058823529}, "entries[0].company_name": {"response": "Hermann Thorens", "ground_truth": "Hermann Thorens", "score": 1.0}, "entries[13].location": {"response": "Lucerne", "ground_truth": "Lucerne", "score": 1.0}, "entries[4].entry_id": {"response": "5", "ground_truth": "156089_1321086_40-5", "score": 0.09999999999999998}, "entries[14].entry_id": {"response": "15", "ground_truth": "156089_1321086_40-15", "score": 0.18181818181818177}, "entries[10].company_name": {"response": "Winandy & Co.", "ground_truth": "Winandy & Co.", "score": 1.0}, "entries[22].entry_id": {"response": "23", "ground_truth": "156089_1321086_40-23", "score": 0.18181818181818177}, "entries[5].location": {"response": "21, Petersgraben, Basle", "ground_truth": "Basle", "score": 0.3571428571428571}, "entries[7].company_name": {"response": "Fr. Schenkel-Wyss", "ground_truth": "Fr. Schenkel-Wyss", "score": 1.0}, "entries[3].entry_id": {"response": "4", "ground_truth": "156089_1321086_40-4", "score": 0.09999999999999998}, "entries[8].company_name": {"response": "Lovell & Christmas, Ltd.", "ground_truth": "Lovell & Christmas, Ltd.", "score": 1.0}, "entries[11].company_name": {"response": "Pro Lemanio", "ground_truth": "Pro Lemano", "score": 0.9523809523809522}, "entries[13].entry_id": {"response": "14", "ground_truth": "156089_1321086_40-14", "score": 0.18181818181818177}, "entries[23].company_name": {"response": "", "ground_truth": "Charles ImObersteg & Co.", "score": 0.0}, "entries[21].location": {"response": "45, Elisabethenstrasse, Basle", "ground_truth": "Lausanne", "score": 0.2162162162162162}, "entries[21].entry_id": {"response": "22", "ground_truth": "156089_1321086_40-22", "score": 0.18181818181818177}, "entries[20].entry_id": {"response": "21", "ground_truth": "156089_1321086_40-21", "score": 0.18181818181818177}, "entries[21].company_name": {"response": "Goth & Co. (General Agents of the Canadian Pacific Railway Co. and of the Dominion Express Co. of Canada)", "ground_truth": "Galland & Co.", "score": 0.2033898305084746}, "entries[9].location": {"response": "16, Kreuzplatz, Zurich", "ground_truth": "Zurich", "score": 0.4285714285714286}, "entries[3].company_name": {"response": "Emil Birkh\u00e4user & Co.", "ground_truth": "Emil Birkh\u00e4user & Co.", "score": 1.0}, "entries[6].entry_id": {"response": "7", "ground_truth": "156089_1321086_40-7", "score": 0.09999999999999998}, "entries[22].location": {"response": "30, Aeschengraben, Basle", "ground_truth": "Basle", "score": 0.3448275862068966}, "entries[23].location": {"response": "", "ground_truth": "Basle", "score": 0.0}, "entries[1].location": {"response": "3, Place St. Fran\u00e7ois, Lausanne", "ground_truth": "Lausanne", "score": 0.41025641025641024}, "entries[19].entry_id": {"response": "20", "ground_truth": "156089_1321086_40-20", "score": 0.18181818181818177}, "entries[1].company_name": {"response": "\"Simex\" Soc. Coop.", "ground_truth": "\"Simex\" Soc. Coop.", "score": 1.0}, "entries[10].location": {"response": "16, Rue de Bourg, Lausanne", "ground_truth": "Lausanne", "score": 0.4705882352941176}, "entries[17].company_name": {"response": "Crowe & Co., Ltd.", "ground_truth": "Canadian Pacific Railway Co.", "score": 0.2666666666666667}, "entries[2].company_name": {"response": "Fabrique d'Automobiles \"Berna\" S. A.", "ground_truth": "Fabrique d'Automobiles \"Berna\" S. A.", "score": 1.0}, "entries[13].company_name": {"response": "Schindler & Co.", "ground_truth": "Schindler & Co.", "score": 1.0}, "entries[9].entry_id": {"response": "10", "ground_truth": "156089_1321086_40-10", "score": 0.18181818181818177}, "entries[17].location": {"response": "67, Nauenstrasse, Basle", "ground_truth": "London S. W. 1", "score": 0.1081081081081081}, "entries[18].entry_id": {"response": "19", "ground_truth": "156089_1321086_40-19", "score": 0.18181818181818177}, "entries[20].location": {"response": "3, Place St. Fran\u00e7ois, Lausanne", "ground_truth": "London S. W. 1", "score": 0.2222222222222222}, "entries[7].entry_id": {"response": "8", "ground_truth": "156089_1321086_40-8", "score": 0.09999999999999998}, "entries[20].company_name": {"response": "Galland & Co.", "ground_truth": "Dominion Express Company of Canada", "score": 0.21276595744680848}, "entries[4].company_name": {"response": "Imprimerie de l'Ere Nouvelle", "ground_truth": "Imprimerie de l'Ere Nouvelle", "score": 1.0}, "entries[4].location": {"response": "12, Rue de la Louve, Lausanne", "ground_truth": "Lausanne", "score": 0.4324324324324324}, "entries[11].entry_id": {"response": "12", "ground_truth": "156089_1321086_40-12", "score": 0.18181818181818177}, "entries[14].location": {"response": "Winterthur", "ground_truth": "Winterthur", "score": 1.0}, "entries[18].location": {"response": "Basle", "ground_truth": "Basle", "score": 1.0}, "entries[12].company_name": {"response": "Th. Roussy, \"Librairie Anglaise\"", "ground_truth": "Th. Roussy, \"Librairie Anglaise\"", "score": 1.0}, "entries[12].location": {"response": "3, Rue de Bourg, Lausanne", "ground_truth": "Lausanne", "score": 0.48484848484848486}, "entries[12].entry_id": {"response": "13", "ground_truth": "156089_1321086_40-13", "score": 0.18181818181818177}, "page_id": {"response": "28", "ground_truth": "156089_1321086_40", "score": 0.21052631578947367}, "entries[15].company_name": {"response": "Basle Warehouse Co., Ltd.", "ground_truth": "Sulzer Fr\u00e8res S. A.", "score": 0.4545454545454546}, "entries[18].company_name": {"response": "Danzas & Co., A. G.", "ground_truth": "Crowe & Co., Ltd.", "score": 0.5}, "entries[8].location": {"response": "West Smithfield, London, E. C. 1.", "ground_truth": "London, E. C. 1", "score": 0.625}, "entries[0].location": {"response": "Ste. Croix", "ground_truth": "Ste. Croix", "score": 1.0}, "entries[5].entry_id": {"response": "6", "ground_truth": "156089_1321086_40-6", "score": 0.09999999999999998}, "entries[2].entry_id": {"response": "3", "ground_truth": "156089_1321086_40-3", "score": 0.09999999999999998}}, "total_fields": 73}, "raw_response": "{\"id\":\"chatcmpl-a777930a-46b1-9648-80f1-f15f5fe7447f\",\"choices\":[{\"finish_reason\":\"stop\",\"index\":0,\"logprobs\":null,\"message\":{\"content\":\"{\\n  \\\"page_id\\\": \\\"28\\\",\\n  \\\"entries\\\": [\\n    {\\n      \\\"entry_id\\\": \\\"1\\\",\\n      \\\"company_name\\\": \\\"Hermann Thorens\\\",\\n      \\\"location\\\": \\\"Ste. Croix\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"2\\\",\\n      \\\"company_name\\\": \\\"\\\\\\\"Simex\\\\\\\" Soc. Coop.\\\",\\n      \\\"location\\\": \\\"3, Place St. Fran\u00e7ois, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"3\\\",\\n      \\\"company_name\\\": \\\"Fabrique d'Automobiles \\\\\\\"Berna\\\\\\\" S. A.\\\",\\n      \\\"location\\\": \\\"Olten\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"4\\\",\\n      \\\"company_name\\\": \\\"Emil Birkh\u00e4user & Co.\\\",\\n      \\\"location\\\": \\\"11, Elisabethenstrasse, Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"5\\\",\\n      \\\"company_name\\\": \\\"Imprimerie de l'Ere Nouvelle\\\",\\n      \\\"location\\\": \\\"12, Rue de la Louve, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"6\\\",\\n      \\\"company_name\\\": \\\"Kreis & Co.\\\",\\n      \\\"location\\\": \\\"21, Petersgraben, Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"7\\\",\\n      \\\"company_name\\\": \\\"S\u00e4uberlin & Pfeiffer S. A.\\\",\\n      \\\"location\\\": \\\"Vevey\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"8\\\",\\n      \\\"company_name\\\": \\\"Fr. Schenkel-Wyss\\\",\\n      \\\"location\\\": \\\"60, Huttenstrasse, Zurich\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"9\\\",\\n      \\\"company_name\\\": \\\"Lovell & Christmas, Ltd.\\\",\\n      \\\"location\\\": \\\"West Smithfield, London, E. C. 1.\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"10\\\",\\n      \\\"company_name\\\": \\\"E. Osswald (Wholesale)\\\",\\n      \\\"location\\\": \\\"16, Kreuzplatz, Zurich\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"11\\\",\\n      \\\"company_name\\\": \\\"Winandy & Co.\\\",\\n      \\\"location\\\": \\\"16, Rue de Bourg, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"12\\\",\\n      \\\"company_name\\\": \\\"Pro Lemanio\\\",\\n      \\\"location\\\": \\\"Grand Ch\u00eane, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"13\\\",\\n      \\\"company_name\\\": \\\"Th. Roussy, \\\\\\\"Librairie Anglaise\\\\\\\"\\\",\\n      \\\"location\\\": \\\"3, Rue de Bourg, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"14\\\",\\n      \\\"company_name\\\": \\\"Schindler & Co.\\\",\\n      \\\"location\\\": \\\"Lucerne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"15\\\",\\n      \\\"company_name\\\": \\\"Sulzer Fr\u00e8res S. A.\\\",\\n      \\\"location\\\": \\\"Winterthur\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"16\\\",\\n      \\\"company_name\\\": \\\"Basle Warehouse Co., Ltd.\\\",\\n      \\\"location\\\": \\\"1, Erlenstrasse, Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"17\\\",\\n      \\\"company_name\\\": \\\"Canadian Pacific Railway Co.\\\",\\n      \\\"location\\\": \\\"62-65, Charing Cross, London S. W. 1.\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"18\\\",\\n      \\\"company_name\\\": \\\"Crowe & Co., Ltd.\\\",\\n      \\\"location\\\": \\\"67, Nauenstrasse, Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"19\\\",\\n      \\\"company_name\\\": \\\"Danzas & Co., A. G.\\\",\\n      \\\"location\\\": \\\"Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"20\\\",\\n      \\\"company_name\\\": \\\"Dominion Express Company of Canada\\\",\\n      \\\"location\\\": \\\"62\u201365, Charing Cross, London S. W. 1.\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"21\\\",\\n      \\\"company_name\\\": \\\"Galland & Co.\\\",\\n      \\\"location\\\": \\\"3, Place St. Fran\u00e7ois, Lausanne\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"22\\\",\\n      \\\"company_name\\\": \\\"Goth & Co. (General Agents of the Canadian Pacific Railway Co. and of the Dominion Express Co. of Canada)\\\",\\n      \\\"location\\\": \\\"45, Elisabethenstrasse, Basle\\\"\\n    },\\n    {\\n      \\\"entry_id\\\": \\\"23\\\",\\n      \\\"company_name\\\": \\\"Charles ImObersteg & Co.\\\",\\n      \\\"location\\\": \\\"30, Aeschengraben, Basle\\\"\\n    }\\n  ]\\n}\",\"refusal\":null,\"role\":\"assistant\",\"annotations\":null,\"audio\":null,\"function_call\":null,\"tool_calls\":null,\"reasoning_content\":\"\"}}],\"created\":1774430244,\"model\":\"qwen3.5-35b-a3b\",\"object\":\"chat.completion\",\"service_tier\":null,\"system_fingerprint\":null,\"usage\":{\"completion_tokens\":1084,\"prompt_tokens\":2715,\"total_tokens\":3799,\"completion_tokens_details\":{\"accepted_prediction_tokens\":null,\"audio_tokens\":null,\"reasoning_tokens\":null,\"rejected_prediction_tokens\":null,\"text_tokens\":1084},\"prompt_tokens_details\":{\"audio_tokens\":null,\"cached_tokens\":null,\"image_tokens\":2503,\"text_tokens\":212}}}"}, "scoring": {"f1_micro": 0.4306784660766962, "f1_macro": 0.44333333333333336, "micro_precision": 0.42034548944337813, "micro_recall": 0.4415322580645161, "total_instances": 15, "total_tp": 438, "total_fp": 604, "total_fn": 554, "cost_summary": {"total_input_tokens": 40921, "total_output_tokens": 15970, "total_tokens": 56891, "input_cost_usd": 0.010230250000000001, "output_cost_usd": 0.03194, "total_cost_usd": 0.042170250000000006}}, "normalized_score": 44.333333333333336}