{"id": 1, "parent_run_id": "569784d8605018c3", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 838, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T19:58:48Z"}
{"id": 2, "parent_run_id": "569784d8605018c3", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 614, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T19:58:49Z"}
{"id": 3, "parent_run_id": "569784d8605018c3", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1899, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T19:58:51Z"}
{"id": 4, "parent_run_id": "2302a774d4a3315e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1344, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T19:59:04Z"}
{"id": 5, "parent_run_id": "2302a774d4a3315e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1435, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T19:59:06Z"}
{"id": 6, "parent_run_id": "2302a774d4a3315e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 3345, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T19:59:09Z"}
{"id": 8, "parent_run_id": "e94044497284edf1", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1099, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-29T20:00:17Z"}
{"id": 9, "parent_run_id": "e94044497284edf1", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 655, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-29T20:00:18Z"}
{"id": 10, "parent_run_id": "e94044497284edf1", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 724, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-29T20:00:19Z"}
{"id": 11, "parent_run_id": "05c6aa064dd2e7a0", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 574, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-29T20:00:19Z"}
{"id": 12, "parent_run_id": "05c6aa064dd2e7a0", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 932, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-29T20:00:20Z"}
{"id": 13, "parent_run_id": "05c6aa064dd2e7a0", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 921, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-29T20:00:21Z"}
{"id": 14, "parent_run_id": "32e48ed3f24ea2c1", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 689, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:00:22Z"}
{"id": 15, "parent_run_id": "32e48ed3f24ea2c1", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 730, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:00:22Z"}
{"id": 16, "parent_run_id": "32e48ed3f24ea2c1", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 767, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:00:23Z"}
{"id": 17, "parent_run_id": "5d2ea7de89422385", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 1179, "input_tokens": 7, "output_tokens": 1, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:00:24Z"}
{"id": 18, "parent_run_id": "5d2ea7de89422385", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 643, "input_tokens": 7, "output_tokens": 1, "cost_eur": 8.249999999999999e-07, "error": null, "created_at": "2026-04-29T20:00:25Z"}
{"id": 19, "parent_run_id": "5d2ea7de89422385", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 652, "input_tokens": 7, "output_tokens": 1, "cost_eur": 1.6499999999999999e-06, "error": null, "created_at": "2026-04-29T20:00:26Z"}
{"id": 20, "parent_run_id": "e537c69770f0b8ea", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 530, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:00:26Z"}
{"id": 21, "parent_run_id": "e537c69770f0b8ea", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 729, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:00:27Z"}
{"id": 22, "parent_run_id": "e537c69770f0b8ea", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 1575, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:00:29Z"}
{"id": 23, "parent_run_id": "50a22d316f18cf47", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 684, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:00:29Z"}
{"id": 24, "parent_run_id": "50a22d316f18cf47", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 712, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:00:30Z"}
{"id": 25, "parent_run_id": "50a22d316f18cf47", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 1669, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:00:32Z"}
{"id": 26, "parent_run_id": "94a0b7c186760859", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 782, "input_tokens": 2, "output_tokens": 1, "cost_eur": 1.75e-06, "error": null, "created_at": "2026-04-29T20:00:32Z"}
{"id": 27, "parent_run_id": "94a0b7c186760859", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 922, "input_tokens": 2, "output_tokens": 1, "cost_eur": 4.5e-07, "error": null, "created_at": "2026-04-29T20:00:33Z"}
{"id": 28, "parent_run_id": "94a0b7c186760859", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 498, "input_tokens": 2, "output_tokens": 1, "cost_eur": 9e-07, "error": null, "created_at": "2026-04-29T20:00:34Z"}
{"id": 29, "parent_run_id": "0c70d782b2f58231", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 1134, "input_tokens": 3, "output_tokens": 1, "cost_eur": 2e-06, "error": null, "created_at": "2026-04-29T20:00:35Z"}
{"id": 30, "parent_run_id": "0c70d782b2f58231", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 711, "input_tokens": 3, "output_tokens": 1, "cost_eur": 5.25e-07, "error": null, "created_at": "2026-04-29T20:00:36Z"}
{"id": 31, "parent_run_id": "0c70d782b2f58231", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 630, "input_tokens": 3, "output_tokens": 1, "cost_eur": 1.05e-06, "error": null, "created_at": "2026-04-29T20:00:36Z"}
{"id": 32, "parent_run_id": "fffea5f0c027c8f5", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 668, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:00:37Z"}
{"id": 33, "parent_run_id": "fffea5f0c027c8f5", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 739, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:00:38Z"}
{"id": 34, "parent_run_id": "fffea5f0c027c8f5", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 582, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:00:38Z"}
{"id": 35, "parent_run_id": "07ef8841e44ea536", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 673, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:00:39Z"}
{"id": 36, "parent_run_id": "07ef8841e44ea536", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 741, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:00:40Z"}
{"id": 37, "parent_run_id": "07ef8841e44ea536", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1284, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:00:41Z"}
{"id": 38, "parent_run_id": "9a106432baeaf861", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 744, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:00:42Z"}
{"id": 39, "parent_run_id": "9a106432baeaf861", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2687, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:00:45Z"}
{"id": 40, "parent_run_id": "9a106432baeaf861", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1098, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:00:46Z"}
{"id": 41, "parent_run_id": "0edef7c530affbb4", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 545, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:00:46Z"}
{"id": 42, "parent_run_id": "0edef7c530affbb4", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1505, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:00:48Z"}
{"id": 43, "parent_run_id": "0edef7c530affbb4", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 565, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:00:48Z"}
{"id": 44, "parent_run_id": "01f4d3c1c7da7883", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 768, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:00:49Z"}
{"id": 45, "parent_run_id": "01f4d3c1c7da7883", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1565, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:00:51Z"}
{"id": 46, "parent_run_id": "01f4d3c1c7da7883", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 788, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:00:51Z"}
{"id": 47, "parent_run_id": "d8a49ab8c7b6e594", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 685, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:00:52Z"}
{"id": 48, "parent_run_id": "d8a49ab8c7b6e594", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2031, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:00:54Z"}
{"id": 49, "parent_run_id": "d8a49ab8c7b6e594", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 543, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:00:55Z"}
{"id": 50, "parent_run_id": "3a00bfa5d27f1c9f", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 701, "input_tokens": 11, "output_tokens": 2, "cost_eur": 5.25e-06, "error": null, "created_at": "2026-04-29T20:00:55Z"}
{"id": 51, "parent_run_id": "3a00bfa5d27f1c9f", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1543, "input_tokens": 11, "output_tokens": 2, "cost_eur": 1.425e-06, "error": null, "created_at": "2026-04-29T20:00:57Z"}
{"id": 52, "parent_run_id": "3a00bfa5d27f1c9f", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 543, "input_tokens": 11, "output_tokens": 2, "cost_eur": 2.85e-06, "error": null, "created_at": "2026-04-29T20:00:58Z"}
{"id": 53, "parent_run_id": "0ca4f51008950c0e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 784, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:00:58Z"}
{"id": 54, "parent_run_id": "0ca4f51008950c0e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1217, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:01:00Z"}
{"id": 55, "parent_run_id": "0ca4f51008950c0e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 5079, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:01:05Z"}
{"id": 56, "parent_run_id": "ec1344e0b4909373", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1257, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-29T20:08:13Z"}
{"id": 57, "parent_run_id": "ec1344e0b4909373", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 707, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-29T20:08:13Z"}
{"id": 58, "parent_run_id": "ec1344e0b4909373", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 689, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-29T20:08:14Z"}
{"id": 59, "parent_run_id": "664b86f26994faa2", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 735, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-29T20:08:15Z"}
{"id": 60, "parent_run_id": "664b86f26994faa2", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1256, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-29T20:08:16Z"}
{"id": 61, "parent_run_id": "664b86f26994faa2", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 838, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-29T20:08:17Z"}
{"id": 62, "parent_run_id": "93ff4fced80ca0fa", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 701, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:08:18Z"}
{"id": 63, "parent_run_id": "93ff4fced80ca0fa", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1214, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:08:19Z"}
{"id": 64, "parent_run_id": "93ff4fced80ca0fa", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 535, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:08:19Z"}
{"id": 65, "parent_run_id": "ce6e905815e92e8c", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 647, "input_tokens": 7, "output_tokens": 1, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:20Z"}
{"id": 66, "parent_run_id": "ce6e905815e92e8c", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 1384, "input_tokens": 7, "output_tokens": 1, "cost_eur": 8.249999999999999e-07, "error": null, "created_at": "2026-04-29T20:08:21Z"}
{"id": 67, "parent_run_id": "ce6e905815e92e8c", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]", "output_text": "es", "expected": "es", "correct": 1, "latency_ms": 655, "input_tokens": 7, "output_tokens": 1, "cost_eur": 1.6499999999999999e-06, "error": null, "created_at": "2026-04-29T20:08:22Z"}
{"id": 68, "parent_run_id": "c3a22b3921b646df", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 685, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:08:23Z"}
{"id": 69, "parent_run_id": "c3a22b3921b646df", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 2440, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:08:25Z"}
{"id": 70, "parent_run_id": "c3a22b3921b646df", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]", "output_text": "uk", "expected": "uk", "correct": 1, "latency_ms": 771, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:08:26Z"}
{"id": 71, "parent_run_id": "13e301ea8d02670b", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 778, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:08:27Z"}
{"id": 72, "parent_run_id": "13e301ea8d02670b", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 1633, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:08:28Z"}
{"id": 73, "parent_run_id": "13e301ea8d02670b", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]", "output_text": "nl", "expected": "nl", "correct": 1, "latency_ms": 553, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:08:29Z"}
{"id": 74, "parent_run_id": "7b52928ba96c33e5", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 839, "input_tokens": 2, "output_tokens": 1, "cost_eur": 1.75e-06, "error": null, "created_at": "2026-04-29T20:08:30Z"}
{"id": 75, "parent_run_id": "7b52928ba96c33e5", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 1025, "input_tokens": 2, "output_tokens": 1, "cost_eur": 4.5e-07, "error": null, "created_at": "2026-04-29T20:08:31Z"}
{"id": 76, "parent_run_id": "7b52928ba96c33e5", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]", "output_text": "zh", "expected": "zh", "correct": 1, "latency_ms": 950, "input_tokens": 2, "output_tokens": 1, "cost_eur": 9e-07, "error": null, "created_at": "2026-04-29T20:08:32Z"}
{"id": 77, "parent_run_id": "432df99b281bf0d2", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 657, "input_tokens": 3, "output_tokens": 1, "cost_eur": 2e-06, "error": null, "created_at": "2026-04-29T20:08:32Z"}
{"id": 78, "parent_run_id": "432df99b281bf0d2", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 1300, "input_tokens": 3, "output_tokens": 1, "cost_eur": 5.25e-07, "error": null, "created_at": "2026-04-29T20:08:34Z"}
{"id": 79, "parent_run_id": "432df99b281bf0d2", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]", "output_text": "ja", "expected": "ja", "correct": 1, "latency_ms": 911, "input_tokens": 3, "output_tokens": 1, "cost_eur": 1.05e-06, "error": null, "created_at": "2026-04-29T20:08:35Z"}
{"id": 80, "parent_run_id": "4ef59567b86b0c49", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 685, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:35Z"}
{"id": 81, "parent_run_id": "4ef59567b86b0c49", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 738, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:08:36Z"}
{"id": 82, "parent_run_id": "4ef59567b86b0c49", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 734, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:37Z"}
{"id": 83, "parent_run_id": "1f0ae896b944f838", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1197, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:38Z"}
{"id": 84, "parent_run_id": "1f0ae896b944f838", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1123, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:08:39Z"}
{"id": 85, "parent_run_id": "1f0ae896b944f838", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 638, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:40Z"}
{"id": 86, "parent_run_id": "0923bd99ff5aab18", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 695, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:08:40Z"}
{"id": 87, "parent_run_id": "0923bd99ff5aab18", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1644, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:08:42Z"}
{"id": 88, "parent_run_id": "0923bd99ff5aab18", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 509, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:08:43Z"}
{"id": 89, "parent_run_id": "c6d76954f935f0c3", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1068, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:44Z"}
{"id": 90, "parent_run_id": "c6d76954f935f0c3", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1212, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:08:45Z"}
{"id": 91, "parent_run_id": "c6d76954f935f0c3", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1248, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:46Z"}
{"id": 92, "parent_run_id": "7e9ddefae86b675b", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 688, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:47Z"}
{"id": 93, "parent_run_id": "7e9ddefae86b675b", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 918, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:08:48Z"}
{"id": 94, "parent_run_id": "7e9ddefae86b675b", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 588, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:48Z"}
{"id": 95, "parent_run_id": "b41e9185c0867d9e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 809, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-29T20:08:49Z"}
{"id": 96, "parent_run_id": "b41e9185c0867d9e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1462, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-29T20:08:51Z"}
{"id": 97, "parent_run_id": "b41e9185c0867d9e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 472, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-29T20:08:51Z"}
{"id": 98, "parent_run_id": "25a0d93cb5e72fd8", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 481, "input_tokens": 11, "output_tokens": 2, "cost_eur": 5.25e-06, "error": null, "created_at": "2026-04-29T20:08:52Z"}
{"id": 99, "parent_run_id": "25a0d93cb5e72fd8", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 925, "input_tokens": 11, "output_tokens": 2, "cost_eur": 1.425e-06, "error": null, "created_at": "2026-04-29T20:08:53Z"}
{"id": 100, "parent_run_id": "25a0d93cb5e72fd8", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 909, "input_tokens": 11, "output_tokens": 2, "cost_eur": 2.85e-06, "error": null, "created_at": "2026-04-29T20:08:53Z"}
{"id": 101, "parent_run_id": "37f42aaa449acc66", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1117, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:55Z"}
{"id": 102, "parent_run_id": "37f42aaa449acc66", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 830, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-29T20:08:55Z"}
{"id": 103, "parent_run_id": "37f42aaa449acc66", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 627, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-29T20:08:56Z"}
{"id": 104, "parent_run_id": "a5a9b705bad1ddf1", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 804, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-29T20:08:57Z"}
{"id": 105, "parent_run_id": "9674a9901a3acb26", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 620, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-29T20:08:58Z"}
{"id": 106, "parent_run_id": "0d5c9963edc33d5e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 688, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:08:58Z"}
{"id": 109, "parent_run_id": "58f716fafc753cee", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1133, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-29T20:09:32Z"}
{"id": 110, "parent_run_id": "2f7f7337874c60d6", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 780, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-29T20:09:32Z"}
{"id": 111, "parent_run_id": "b1f2379c878183d0", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 920, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-29T20:09:33Z"}
{"id": 163, "parent_run_id": "c09e5aaa82d3a5c2", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1238, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:18Z"}
{"id": 164, "parent_run_id": "c09e5aaa82d3a5c2", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1785, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:20Z"}
{"id": 165, "parent_run_id": "c09e5aaa82d3a5c2", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1889, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:21Z"}
{"id": 166, "parent_run_id": "5cd01907ecb5ab71", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 682, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:22Z"}
{"id": 167, "parent_run_id": "5cd01907ecb5ab71", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1318, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:23Z"}
{"id": 168, "parent_run_id": "5cd01907ecb5ab71", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 726, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:24Z"}
{"id": 169, "parent_run_id": "5f801996834333cd", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 551, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T03:57:25Z"}
{"id": 170, "parent_run_id": "5f801996834333cd", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2284, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T03:57:27Z"}
{"id": 171, "parent_run_id": "5f801996834333cd", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 833, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T03:57:28Z"}
{"id": 172, "parent_run_id": "f8071966fc082d1d", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 654, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-30T03:57:29Z"}
{"id": 173, "parent_run_id": "f8071966fc082d1d", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 621, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-30T03:57:29Z"}
{"id": 174, "parent_run_id": "f8071966fc082d1d", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 701, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-30T03:57:30Z"}
{"id": 175, "parent_run_id": "7b592c04cec63660", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 671, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-30T03:57:31Z"}
{"id": 176, "parent_run_id": "7b592c04cec63660", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 620, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-30T03:57:31Z"}
{"id": 177, "parent_run_id": "7b592c04cec63660", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 490, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-30T03:57:32Z"}
{"id": 178, "parent_run_id": "49df5566ec200f98", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 628, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T03:57:32Z"}
{"id": 179, "parent_run_id": "49df5566ec200f98", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 575, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T03:57:33Z"}
{"id": 180, "parent_run_id": "49df5566ec200f98", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 2250, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T03:57:35Z"}
{"id": 181, "parent_run_id": "5c99f533b4ddc7c5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 706, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-30T03:57:36Z"}
{"id": 182, "parent_run_id": "da12cecb8bddffa2", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 673, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T03:57:37Z"}
{"id": 183, "parent_run_id": "5d2591057eab2f18", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 698, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:37Z"}
{"id": 184, "parent_run_id": "163d3748659dfe17", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 459, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-30T03:57:38Z"}
{"id": 185, "parent_run_id": "163d3748659dfe17", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 513, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-30T03:57:38Z"}
{"id": 186, "parent_run_id": "163d3748659dfe17", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1470, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-30T03:57:40Z"}
{"id": 187, "parent_run_id": "afd16d4d9c56a3ac", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 603, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-30T03:57:40Z"}
{"id": 188, "parent_run_id": "afd16d4d9c56a3ac", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 659, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-30T03:57:41Z"}
{"id": 189, "parent_run_id": "afd16d4d9c56a3ac", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 419, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-30T03:57:41Z"}
{"id": 190, "parent_run_id": "56c37aa4132a570a", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 769, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T03:57:42Z"}
{"id": 191, "parent_run_id": "56c37aa4132a570a", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 978, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T03:57:43Z"}
{"id": 192, "parent_run_id": "56c37aa4132a570a", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1406, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T03:57:45Z"}
{"id": 193, "parent_run_id": "9ff49a2c51560b34", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 596, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:45Z"}
{"id": 194, "parent_run_id": "9ff49a2c51560b34", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1366, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:47Z"}
{"id": 195, "parent_run_id": "9ff49a2c51560b34", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 824, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:47Z"}
{"id": 196, "parent_run_id": "dbd9714b10d44175", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 645, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:48Z"}
{"id": 197, "parent_run_id": "dbd9714b10d44175", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 768, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:49Z"}
{"id": 198, "parent_run_id": "dbd9714b10d44175", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 546, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:49Z"}
{"id": 199, "parent_run_id": "0b4c8ac78f753d28", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 437, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T03:57:50Z"}
{"id": 200, "parent_run_id": "0b4c8ac78f753d28", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2030, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T03:57:52Z"}
{"id": 201, "parent_run_id": "0b4c8ac78f753d28", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 953, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T03:57:53Z"}
{"id": 202, "parent_run_id": "7c1d84e0de0c892d", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 730, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:54Z"}
{"id": 203, "parent_run_id": "7c1d84e0de0c892d", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1079, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:55Z"}
{"id": 204, "parent_run_id": "7c1d84e0de0c892d", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 882, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:55Z"}
{"id": 205, "parent_run_id": "5325c330ebb6d081", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 663, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:57:56Z"}
{"id": 206, "parent_run_id": "5325c330ebb6d081", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 830, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T03:57:57Z"}
{"id": 207, "parent_run_id": "5325c330ebb6d081", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 786, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T03:57:58Z"}
{"id": 208, "parent_run_id": "d1ae73c0de4af741", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 467, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T03:57:58Z"}
{"id": 209, "parent_run_id": "d1ae73c0de4af741", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1848, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T03:58:00Z"}
{"id": 210, "parent_run_id": "d1ae73c0de4af741", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 570, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T03:58:01Z"}
{"id": 211, "parent_run_id": "ee3688380110e8f5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 712, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-30T03:58:01Z"}
{"id": 212, "parent_run_id": "ba4150af1e444210", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 696, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T03:58:02Z"}
{"id": 213, "parent_run_id": "0ead5a10d507a438", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 666, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:58:03Z"}
{"id": 214, "parent_run_id": "77eedc90a745b043", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\n  \"alice@example.com\",\n  \"bob.smith@test.org\"\n]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 876, "input_tokens": 15, "output_tokens": 15, "cost_eur": 2.25e-05, "error": null, "created_at": "2026-04-30T03:58:04Z"}
{"id": 215, "parent_run_id": "341b5fb21f215e13", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 590, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T03:58:04Z"}
{"id": 216, "parent_run_id": "5fdd56cf16bf18ed", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 651, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T03:58:05Z"}
{"id": 217, "parent_run_id": "b3e6999434c12f90", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1803, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:00Z"}
{"id": 218, "parent_run_id": "b3e6999434c12f90", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 715, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:00Z"}
{"id": 219, "parent_run_id": "b3e6999434c12f90", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 719, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:01Z"}
{"id": 220, "parent_run_id": "69693f3b4b4eb469", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 778, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:02Z"}
{"id": 221, "parent_run_id": "69693f3b4b4eb469", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1520, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:03Z"}
{"id": 222, "parent_run_id": "69693f3b4b4eb469", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 723, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:04Z"}
{"id": 223, "parent_run_id": "bf8e6fc6923a78e4", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 935, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T05:01:05Z"}
{"id": 224, "parent_run_id": "bf8e6fc6923a78e4", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2364, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T05:01:08Z"}
{"id": 225, "parent_run_id": "bf8e6fc6923a78e4", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 996, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T05:01:09Z"}
{"id": 226, "parent_run_id": "da9e2d4be31deafc", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 662, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-30T05:01:09Z"}
{"id": 227, "parent_run_id": "da9e2d4be31deafc", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 758, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-30T05:01:10Z"}
{"id": 228, "parent_run_id": "da9e2d4be31deafc", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 748, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-30T05:01:11Z"}
{"id": 229, "parent_run_id": "dc099b48b31646bb", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 641, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-30T05:01:11Z"}
{"id": 230, "parent_run_id": "dc099b48b31646bb", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 837, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-30T05:01:12Z"}
{"id": 231, "parent_run_id": "dc099b48b31646bb", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 788, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-30T05:01:13Z"}
{"id": 232, "parent_run_id": "acc5b8b8426fc539", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 900, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T05:01:14Z"}
{"id": 233, "parent_run_id": "acc5b8b8426fc539", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 951, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T05:01:15Z"}
{"id": 234, "parent_run_id": "acc5b8b8426fc539", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 631, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T05:01:15Z"}
{"id": 235, "parent_run_id": "e4c6a274897db81a", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 753, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-30T05:01:16Z"}
{"id": 236, "parent_run_id": "8eaa5b511ba7ceb3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 868, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T05:01:17Z"}
{"id": 237, "parent_run_id": "260bced4c91a3626", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 920, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:18Z"}
{"id": 238, "parent_run_id": "cdb006de647d8323", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 973, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-04-30T05:01:19Z"}
{"id": 239, "parent_run_id": "cdb006de647d8323", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 825, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-04-30T05:01:20Z"}
{"id": 240, "parent_run_id": "cdb006de647d8323", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 702, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-04-30T05:01:21Z"}
{"id": 241, "parent_run_id": "382fec2a79835556", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 2711, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-04-30T05:01:23Z"}
{"id": 242, "parent_run_id": "382fec2a79835556", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 917, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-04-30T05:01:24Z"}
{"id": 243, "parent_run_id": "382fec2a79835556", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 442, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-04-30T05:01:25Z"}
{"id": 244, "parent_run_id": "8696116792cbd76a", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 691, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T05:01:25Z"}
{"id": 245, "parent_run_id": "8696116792cbd76a", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 617, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T05:01:26Z"}
{"id": 246, "parent_run_id": "8696116792cbd76a", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 710, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T05:01:27Z"}
{"id": 247, "parent_run_id": "22ec532678ff8f22", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 622, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:27Z"}
{"id": 248, "parent_run_id": "22ec532678ff8f22", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1087, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:28Z"}
{"id": 249, "parent_run_id": "22ec532678ff8f22", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 410, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:29Z"}
{"id": 250, "parent_run_id": "1bbd931ee93144a9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 662, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:29Z"}
{"id": 251, "parent_run_id": "1bbd931ee93144a9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1098, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:31Z"}
{"id": 252, "parent_run_id": "1bbd931ee93144a9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 629, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:31Z"}
{"id": 253, "parent_run_id": "97adcbc6fabf19a9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 634, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T05:01:32Z"}
{"id": 254, "parent_run_id": "97adcbc6fabf19a9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 4161, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-04-30T05:01:36Z"}
{"id": 255, "parent_run_id": "97adcbc6fabf19a9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2210, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T05:01:38Z"}
{"id": 256, "parent_run_id": "12f0822948c8c417", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 608, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:39Z"}
{"id": 257, "parent_run_id": "12f0822948c8c417", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1203, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:40Z"}
{"id": 258, "parent_run_id": "12f0822948c8c417", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 385, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:40Z"}
{"id": 259, "parent_run_id": "a145be8a15eeedfa", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 2690, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:43Z"}
{"id": 260, "parent_run_id": "a145be8a15eeedfa", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1539, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-04-30T05:01:45Z"}
{"id": 261, "parent_run_id": "a145be8a15eeedfa", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 534, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-04-30T05:01:45Z"}
{"id": 262, "parent_run_id": "5310a92252d0f897", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 707, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-04-30T05:01:46Z"}
{"id": 263, "parent_run_id": "5310a92252d0f897", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2646, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-04-30T05:01:49Z"}
{"id": 264, "parent_run_id": "5310a92252d0f897", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 514, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-04-30T05:01:49Z"}
{"id": 265, "parent_run_id": "1d5458b42eac071b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 767, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-30T05:01:50Z"}
{"id": 266, "parent_run_id": "bb34ce671346fd28", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 757, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T05:01:51Z"}
{"id": 267, "parent_run_id": "b3f98870bf2a6386", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 765, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:51Z"}
{"id": 268, "parent_run_id": "686efe1daaf6b507", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 851, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-04-30T05:01:52Z"}
{"id": 269, "parent_run_id": "e2bda82e8acaa770", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 742, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-04-30T05:01:53Z"}
{"id": 270, "parent_run_id": "eced7ec5717eeed3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 663, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-04-30T05:01:54Z"}
{"id": 271, "parent_run_id": "f5e08181dd53d420", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1390, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:20Z"}
{"id": 272, "parent_run_id": "f5e08181dd53d420", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 745, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:21Z"}
{"id": 273, "parent_run_id": "f5e08181dd53d420", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1562, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:22Z"}
{"id": 274, "parent_run_id": "0b8d3a5acce62411", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 710, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:23Z"}
{"id": 275, "parent_run_id": "0b8d3a5acce62411", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1272, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:24Z"}
{"id": 276, "parent_run_id": "0b8d3a5acce62411", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 557, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:25Z"}
{"id": 277, "parent_run_id": "d98866809761018e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 727, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-01T05:00:25Z"}
{"id": 278, "parent_run_id": "d98866809761018e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2000, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-01T05:00:27Z"}
{"id": 279, "parent_run_id": "d98866809761018e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 886, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-01T05:00:28Z"}
{"id": 280, "parent_run_id": "4a2105df029d21c8", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 699, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-01T05:00:29Z"}
{"id": 281, "parent_run_id": "4a2105df029d21c8", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 673, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-01T05:00:30Z"}
{"id": 282, "parent_run_id": "4a2105df029d21c8", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 808, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-01T05:00:31Z"}
{"id": 283, "parent_run_id": "89bd10524f4ad348", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 683, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-01T05:00:31Z"}
{"id": 284, "parent_run_id": "89bd10524f4ad348", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 695, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-01T05:00:32Z"}
{"id": 285, "parent_run_id": "89bd10524f4ad348", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 454, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-01T05:00:32Z"}
{"id": 286, "parent_run_id": "7724143b111c3db7", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 860, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-01T05:00:33Z"}
{"id": 287, "parent_run_id": "7724143b111c3db7", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 904, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-01T05:00:34Z"}
{"id": 288, "parent_run_id": "7724143b111c3db7", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1373, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-01T05:00:36Z"}
{"id": 289, "parent_run_id": "79e8130e8c0f816e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 796, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-01T05:00:36Z"}
{"id": 290, "parent_run_id": "c65adee1e55ddcfa", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 733, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-01T05:00:37Z"}
{"id": 291, "parent_run_id": "8be8d6cae651a103", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1020, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:38Z"}
{"id": 292, "parent_run_id": "6ccccbfc79c76e35", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 532, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-01T05:00:39Z"}
{"id": 293, "parent_run_id": "6ccccbfc79c76e35", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 827, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-01T05:00:39Z"}
{"id": 294, "parent_run_id": "6ccccbfc79c76e35", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 765, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-01T05:00:40Z"}
{"id": 295, "parent_run_id": "0c47ced9d8d50e3f", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 749, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-01T05:00:41Z"}
{"id": 296, "parent_run_id": "0c47ced9d8d50e3f", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 617, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-01T05:00:42Z"}
{"id": 297, "parent_run_id": "0c47ced9d8d50e3f", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 844, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-01T05:00:42Z"}
{"id": 298, "parent_run_id": "418cc3e07572bede", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 615, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-01T05:00:43Z"}
{"id": 299, "parent_run_id": "418cc3e07572bede", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 941, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-01T05:00:44Z"}
{"id": 300, "parent_run_id": "418cc3e07572bede", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 453, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-01T05:00:44Z"}
{"id": 301, "parent_run_id": "335fbed6765f703d", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 909, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:45Z"}
{"id": 302, "parent_run_id": "335fbed6765f703d", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 857, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:46Z"}
{"id": 303, "parent_run_id": "335fbed6765f703d", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 601, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:47Z"}
{"id": 304, "parent_run_id": "0e4707492261c26a", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 794, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:48Z"}
{"id": 305, "parent_run_id": "0e4707492261c26a", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1341, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:49Z"}
{"id": 306, "parent_run_id": "0e4707492261c26a", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 526, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:50Z"}
{"id": 307, "parent_run_id": "1262a2b90563102e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 565, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-01T05:00:50Z"}
{"id": 308, "parent_run_id": "1262a2b90563102e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2129, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-01T05:00:52Z"}
{"id": 309, "parent_run_id": "1262a2b90563102e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 480, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-01T05:00:53Z"}
{"id": 310, "parent_run_id": "e99ad07c936f352e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 710, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:53Z"}
{"id": 311, "parent_run_id": "e99ad07c936f352e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1251, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:55Z"}
{"id": 312, "parent_run_id": "e99ad07c936f352e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 412, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:55Z"}
{"id": 313, "parent_run_id": "1d058112a46b915b", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 685, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:00:56Z"}
{"id": 314, "parent_run_id": "1d058112a46b915b", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1014, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-01T05:00:57Z"}
{"id": 315, "parent_run_id": "1d058112a46b915b", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 805, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-01T05:00:58Z"}
{"id": 316, "parent_run_id": "46bb09449fa21a52", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2371, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-01T05:01:00Z"}
{"id": 317, "parent_run_id": "46bb09449fa21a52", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2672, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-01T05:01:03Z"}
{"id": 318, "parent_run_id": "46bb09449fa21a52", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 496, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-01T05:01:03Z"}
{"id": 319, "parent_run_id": "95d57e27968cbf8d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 775, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-01T05:01:04Z"}
{"id": 320, "parent_run_id": "f4419a2f862019ac", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 760, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-01T05:01:05Z"}
{"id": 321, "parent_run_id": "a21d1fcd10cbc612", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 717, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:01:06Z"}
{"id": 322, "parent_run_id": "ea3ee2a70ce54be0", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 764, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-01T05:01:06Z"}
{"id": 323, "parent_run_id": "f63d1aedbc32f13e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 594, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-01T05:01:07Z"}
{"id": 324, "parent_run_id": "fa26bb6eee780038", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 565, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-01T05:01:07Z"}
{"id": 325, "parent_run_id": "a520bffc3fa0df51", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1480, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:03:50Z"}
{"id": 326, "parent_run_id": "a520bffc3fa0df51", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 592, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:03:50Z"}
{"id": 327, "parent_run_id": "a520bffc3fa0df51", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 870, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:03:51Z"}
{"id": 328, "parent_run_id": "19be8f7f16f7698e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 918, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:03:52Z"}
{"id": 329, "parent_run_id": "19be8f7f16f7698e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1184, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:03:53Z"}
{"id": 330, "parent_run_id": "19be8f7f16f7698e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1209, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:03:54Z"}
{"id": 331, "parent_run_id": "65f05a6600f33b96", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "positive", "expected": "neutral", "correct": 0, "latency_ms": 457, "input_tokens": 9, "output_tokens": 2, "cost_eur": 4.75e-06, "error": null, "created_at": "2026-05-02T05:03:55Z"}
{"id": 332, "parent_run_id": "65f05a6600f33b96", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 2602, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-02T05:03:57Z"}
{"id": 333, "parent_run_id": "65f05a6600f33b96", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 557, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-02T05:03:58Z"}
{"id": 334, "parent_run_id": "31f79c1b9f551bf0", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 833, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-02T05:03:59Z"}
{"id": 335, "parent_run_id": "c9f3d1c37d29e47a", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 684, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-02T05:04:00Z"}
{"id": 336, "parent_run_id": "0642c14ff1d01266", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 810, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:00Z"}
{"id": 337, "parent_run_id": "d1be3a01c6a4d7e2", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 476, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-02T05:04:01Z"}
{"id": 338, "parent_run_id": "d1be3a01c6a4d7e2", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 588, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-02T05:04:01Z"}
{"id": 339, "parent_run_id": "d1be3a01c6a4d7e2", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 819, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-02T05:04:02Z"}
{"id": 340, "parent_run_id": "937e65fa2bf26773", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 526, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-02T05:04:03Z"}
{"id": 341, "parent_run_id": "937e65fa2bf26773", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 952, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-02T05:04:04Z"}
{"id": 342, "parent_run_id": "937e65fa2bf26773", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 430, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-02T05:04:04Z"}
{"id": 343, "parent_run_id": "fd03af78aa73fca4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 708, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-02T05:04:05Z"}
{"id": 344, "parent_run_id": "fd03af78aa73fca4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 695, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-02T05:04:06Z"}
{"id": 345, "parent_run_id": "fd03af78aa73fca4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 708, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-02T05:04:06Z"}
{"id": 346, "parent_run_id": "48bd8f99542a9ce2", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 713, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-02T05:04:07Z"}
{"id": 347, "parent_run_id": "48bd8f99542a9ce2", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 686, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-02T05:04:08Z"}
{"id": 348, "parent_run_id": "48bd8f99542a9ce2", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 842, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-02T05:04:09Z"}
{"id": 349, "parent_run_id": "27335671ef9ac90e", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 714, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-02T05:04:09Z"}
{"id": 350, "parent_run_id": "27335671ef9ac90e", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 2743, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-02T05:04:12Z"}
{"id": 351, "parent_run_id": "27335671ef9ac90e", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 864, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-02T05:04:13Z"}
{"id": 352, "parent_run_id": "5ef4043f6730fa37", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 456, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-02T05:04:13Z"}
{"id": 353, "parent_run_id": "5ef4043f6730fa37", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 633, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-02T05:04:14Z"}
{"id": 354, "parent_run_id": "5ef4043f6730fa37", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1624, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-02T05:04:16Z"}
{"id": 355, "parent_run_id": "40572696c5d1a62e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 527, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:16Z"}
{"id": 356, "parent_run_id": "40572696c5d1a62e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 603, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:04:17Z"}
{"id": 357, "parent_run_id": "40572696c5d1a62e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 435, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:04:17Z"}
{"id": 358, "parent_run_id": "8708d3e09408a2a4", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 950, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:18Z"}
{"id": 359, "parent_run_id": "8708d3e09408a2a4", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 2165, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:04:20Z"}
{"id": 360, "parent_run_id": "8708d3e09408a2a4", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 966, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:04:21Z"}
{"id": 361, "parent_run_id": "1554805766880ea9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 967, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-02T05:04:22Z"}
{"id": 362, "parent_run_id": "1554805766880ea9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2228, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-02T05:04:25Z"}
{"id": 363, "parent_run_id": "1554805766880ea9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2202, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-02T05:04:27Z"}
{"id": 364, "parent_run_id": "708e9140dc72751a", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1598, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:28Z"}
{"id": 365, "parent_run_id": "708e9140dc72751a", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 973, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:04:29Z"}
{"id": 366, "parent_run_id": "708e9140dc72751a", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 464, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:04:30Z"}
{"id": 367, "parent_run_id": "a26fee4f295bd1cf", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 815, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:31Z"}
{"id": 368, "parent_run_id": "a26fee4f295bd1cf", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1258, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-02T05:04:32Z"}
{"id": 369, "parent_run_id": "a26fee4f295bd1cf", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 811, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-02T05:04:33Z"}
{"id": 370, "parent_run_id": "3447094880117721", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 435, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-02T05:04:33Z"}
{"id": 371, "parent_run_id": "3447094880117721", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2928, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-02T05:04:36Z"}
{"id": 372, "parent_run_id": "3447094880117721", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 414, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-02T05:04:37Z"}
{"id": 373, "parent_run_id": "385e47e66d7792de", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 909, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-02T05:04:37Z"}
{"id": 374, "parent_run_id": "69b6b33263b58c7b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 722, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-02T05:04:38Z"}
{"id": 375, "parent_run_id": "a53b6cb3ba8b1794", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 724, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:39Z"}
{"id": 376, "parent_run_id": "77dd92ef321fe0e5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 736, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-02T05:04:40Z"}
{"id": 377, "parent_run_id": "9698f371b6eda0aa", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 749, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-02T05:04:40Z"}
{"id": 378, "parent_run_id": "2732284a37f76c99", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 606, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-02T05:04:41Z"}
{"id": 379, "parent_run_id": "be7c06e0e38d7727", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1603, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:13Z"}
{"id": 380, "parent_run_id": "be7c06e0e38d7727", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1197, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:14Z"}
{"id": 381, "parent_run_id": "be7c06e0e38d7727", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 2160, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:16Z"}
{"id": 382, "parent_run_id": "35ea294e7b5cd325", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 698, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:17Z"}
{"id": 383, "parent_run_id": "35ea294e7b5cd325", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 729, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:17Z"}
{"id": 384, "parent_run_id": "35ea294e7b5cd325", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 902, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:18Z"}
{"id": 385, "parent_run_id": "25e47c93feb6a59e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 612, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-03T05:01:19Z"}
{"id": 386, "parent_run_id": "25e47c93feb6a59e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 3966, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-03T05:01:23Z"}
{"id": 387, "parent_run_id": "25e47c93feb6a59e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1747, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-03T05:01:25Z"}
{"id": 388, "parent_run_id": "a0b9445bf3327626", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 678, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-03T05:01:25Z"}
{"id": 389, "parent_run_id": "3adf3c4909a63302", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 779, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-03T05:01:26Z"}
{"id": 390, "parent_run_id": "cd753c6788d62ffc", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 623, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:27Z"}
{"id": 391, "parent_run_id": "64a194fee9b083c7", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 623, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-03T05:01:27Z"}
{"id": 392, "parent_run_id": "64a194fee9b083c7", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 881, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-03T05:01:28Z"}
{"id": 393, "parent_run_id": "64a194fee9b083c7", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1614, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-03T05:01:30Z"}
{"id": 394, "parent_run_id": "39331063492c10d6", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 458, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-03T05:01:30Z"}
{"id": 395, "parent_run_id": "39331063492c10d6", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 642, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-03T05:01:31Z"}
{"id": 396, "parent_run_id": "39331063492c10d6", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 474, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-03T05:01:31Z"}
{"id": 397, "parent_run_id": "a9cfa975f6bf8333", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 457, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-03T05:01:32Z"}
{"id": 398, "parent_run_id": "a9cfa975f6bf8333", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 685, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-03T05:01:33Z"}
{"id": 399, "parent_run_id": "a9cfa975f6bf8333", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 716, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-03T05:01:33Z"}
{"id": 400, "parent_run_id": "08648ea18ced865b", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 670, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-03T05:01:34Z"}
{"id": 401, "parent_run_id": "08648ea18ced865b", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 549, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-03T05:01:35Z"}
{"id": 402, "parent_run_id": "08648ea18ced865b", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1002, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-03T05:01:36Z"}
{"id": 403, "parent_run_id": "0a967a3f3dcc802a", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 606, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-03T05:01:36Z"}
{"id": 404, "parent_run_id": "0a967a3f3dcc802a", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 759, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-03T05:01:37Z"}
{"id": 405, "parent_run_id": "0a967a3f3dcc802a", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 458, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-03T05:01:37Z"}
{"id": 406, "parent_run_id": "e78af948bfe0e40d", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 636, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-03T05:01:38Z"}
{"id": 407, "parent_run_id": "e78af948bfe0e40d", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 683, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-03T05:01:39Z"}
{"id": 408, "parent_run_id": "e78af948bfe0e40d", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1052, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-03T05:01:40Z"}
{"id": 409, "parent_run_id": "0ef3230faa8e67be", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 534, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:40Z"}
{"id": 410, "parent_run_id": "0ef3230faa8e67be", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1126, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:42Z"}
{"id": 411, "parent_run_id": "0ef3230faa8e67be", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 759, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:42Z"}
{"id": 412, "parent_run_id": "10176a254af09444", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 675, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:43Z"}
{"id": 413, "parent_run_id": "10176a254af09444", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1189, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:44Z"}
{"id": 414, "parent_run_id": "10176a254af09444", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 637, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:45Z"}
{"id": 415, "parent_run_id": "8c61d1db2abcecbc", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 671, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-03T05:01:46Z"}
{"id": 416, "parent_run_id": "8c61d1db2abcecbc", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2300, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-03T05:01:48Z"}
{"id": 417, "parent_run_id": "8c61d1db2abcecbc", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 528, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-03T05:01:48Z"}
{"id": 418, "parent_run_id": "91c6066346700947", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 631, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:49Z"}
{"id": 419, "parent_run_id": "91c6066346700947", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 993, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:50Z"}
{"id": 420, "parent_run_id": "91c6066346700947", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 709, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:51Z"}
{"id": 421, "parent_run_id": "ecfd379c6d20a8f7", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 609, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:51Z"}
{"id": 422, "parent_run_id": "ecfd379c6d20a8f7", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1309, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-03T05:01:53Z"}
{"id": 423, "parent_run_id": "ecfd379c6d20a8f7", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 649, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-03T05:01:53Z"}
{"id": 424, "parent_run_id": "233e710412fc4d72", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 591, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-03T05:01:54Z"}
{"id": 425, "parent_run_id": "233e710412fc4d72", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2045, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-03T05:01:56Z"}
{"id": 426, "parent_run_id": "233e710412fc4d72", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 413, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-03T05:01:56Z"}
{"id": 427, "parent_run_id": "6a92b9cf2d1e6b76", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 557, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-03T05:01:57Z"}
{"id": 428, "parent_run_id": "8779fbed46a6517c", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 779, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-03T05:01:58Z"}
{"id": 429, "parent_run_id": "1d4c31254469ca10", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 651, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:01:58Z"}
{"id": 430, "parent_run_id": "edfb7921e1c94a2e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 733, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-03T05:01:59Z"}
{"id": 431, "parent_run_id": "fbdc14aecea9a5a2", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 872, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-03T05:02:00Z"}
{"id": 432, "parent_run_id": "493224dc4f8830b9", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 680, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-03T05:02:01Z"}
{"id": 433, "parent_run_id": "c3c1a8aec3c1fce7", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1508, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:01:35Z"}
{"id": 434, "parent_run_id": "c3c1a8aec3c1fce7", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1055, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:01:37Z"}
{"id": 435, "parent_run_id": "c3c1a8aec3c1fce7", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 580, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:01:37Z"}
{"id": 436, "parent_run_id": "fea78e7b8d058865", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 673, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:01:38Z"}
{"id": 437, "parent_run_id": "fea78e7b8d058865", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1422, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:01:39Z"}
{"id": 438, "parent_run_id": "fea78e7b8d058865", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1219, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:01:40Z"}
{"id": 439, "parent_run_id": "66b1af4f1517e878", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 748, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-04T05:01:41Z"}
{"id": 440, "parent_run_id": "66b1af4f1517e878", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2399, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-04T05:01:44Z"}
{"id": 441, "parent_run_id": "66b1af4f1517e878", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1837, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-04T05:01:45Z"}
{"id": 442, "parent_run_id": "345cab077f770405", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1118, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-04T05:01:47Z"}
{"id": 443, "parent_run_id": "36498ba563fbc347", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 678, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-04T05:01:47Z"}
{"id": 444, "parent_run_id": "0b0a23a9edf0a4ca", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 549, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:01:48Z"}
{"id": 445, "parent_run_id": "1516ec6bc1db288d", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 637, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-04T05:01:48Z"}
{"id": 446, "parent_run_id": "1516ec6bc1db288d", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 792, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-04T05:01:49Z"}
{"id": 447, "parent_run_id": "1516ec6bc1db288d", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 844, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-04T05:01:50Z"}
{"id": 448, "parent_run_id": "a13000c61ac2d2b5", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 648, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-04T05:01:51Z"}
{"id": 449, "parent_run_id": "a13000c61ac2d2b5", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 774, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-04T05:01:52Z"}
{"id": 450, "parent_run_id": "a13000c61ac2d2b5", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 853, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-04T05:01:52Z"}
{"id": 451, "parent_run_id": "0898dd58ae520395", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 690, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-04T05:01:53Z"}
{"id": 452, "parent_run_id": "0898dd58ae520395", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 611, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-04T05:01:54Z"}
{"id": 453, "parent_run_id": "0898dd58ae520395", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 860, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-04T05:01:55Z"}
{"id": 454, "parent_run_id": "923e666ee11f07df", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 722, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-04T05:01:55Z"}
{"id": 455, "parent_run_id": "923e666ee11f07df", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 788, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-04T05:01:56Z"}
{"id": 456, "parent_run_id": "923e666ee11f07df", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 466, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-04T05:01:57Z"}
{"id": 457, "parent_run_id": "af838ab93aa3d044", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 628, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-04T05:01:57Z"}
{"id": 458, "parent_run_id": "af838ab93aa3d044", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1099, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-04T05:01:58Z"}
{"id": 459, "parent_run_id": "af838ab93aa3d044", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 483, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-04T05:01:59Z"}
{"id": 460, "parent_run_id": "a6b912ef230396a6", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 661, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-04T05:01:59Z"}
{"id": 461, "parent_run_id": "a6b912ef230396a6", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 590, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-04T05:02:00Z"}
{"id": 462, "parent_run_id": "a6b912ef230396a6", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 445, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-04T05:02:01Z"}
{"id": 463, "parent_run_id": "153bf64b2719607c", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 849, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:01Z"}
{"id": 464, "parent_run_id": "153bf64b2719607c", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1226, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:02:03Z"}
{"id": 465, "parent_run_id": "153bf64b2719607c", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 364, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:02:03Z"}
{"id": 466, "parent_run_id": "ae24ae06526fd053", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 715, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:04Z"}
{"id": 467, "parent_run_id": "ae24ae06526fd053", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1452, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:02:05Z"}
{"id": 468, "parent_run_id": "ae24ae06526fd053", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 871, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:02:06Z"}
{"id": 469, "parent_run_id": "4958ea3abb1ca1d8", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 566, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-04T05:02:07Z"}
{"id": 470, "parent_run_id": "4958ea3abb1ca1d8", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2621, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-04T05:02:09Z"}
{"id": 471, "parent_run_id": "4958ea3abb1ca1d8", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1200, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-04T05:02:10Z"}
{"id": 472, "parent_run_id": "d49733b20cfad736", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 515, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:11Z"}
{"id": 473, "parent_run_id": "d49733b20cfad736", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 648, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:02:12Z"}
{"id": 474, "parent_run_id": "d49733b20cfad736", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 354, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:02:12Z"}
{"id": 475, "parent_run_id": "4fde0349fdf3092e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 467, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:12Z"}
{"id": 476, "parent_run_id": "4fde0349fdf3092e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1228, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-04T05:02:14Z"}
{"id": 477, "parent_run_id": "4fde0349fdf3092e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 632, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-04T05:02:14Z"}
{"id": 478, "parent_run_id": "07db12f072c00b34", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 700, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-04T05:02:15Z"}
{"id": 479, "parent_run_id": "07db12f072c00b34", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2253, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-04T05:02:17Z"}
{"id": 480, "parent_run_id": "07db12f072c00b34", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 832, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-04T05:02:18Z"}
{"id": 481, "parent_run_id": "ba4d41e1f477b00f", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 743, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-04T05:02:19Z"}
{"id": 482, "parent_run_id": "3c556bf33f968afa", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 977, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-04T05:02:20Z"}
{"id": 483, "parent_run_id": "eea52049a44500e8", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 539, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:20Z"}
{"id": 484, "parent_run_id": "d8d761f3b4c91f0e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 837, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-04T05:02:21Z"}
{"id": 485, "parent_run_id": "805deca8ff617394", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 849, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-04T05:02:22Z"}
{"id": 486, "parent_run_id": "7f243dea0c191a78", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 677, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-04T05:02:23Z"}
{"id": 530, "parent_run_id": "101dad2a4b0a6e56", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 2207, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:04Z"}
{"id": 531, "parent_run_id": "101dad2a4b0a6e56", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1245, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:06Z"}
{"id": 532, "parent_run_id": "101dad2a4b0a6e56", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1062, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:07Z"}
{"id": 533, "parent_run_id": "52e447619f3d2574", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 681, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:07Z"}
{"id": 534, "parent_run_id": "52e447619f3d2574", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 957, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:08Z"}
{"id": 535, "parent_run_id": "52e447619f3d2574", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 441, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:09Z"}
{"id": 536, "parent_run_id": "e37fc0051818372a", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 892, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-05T05:02:10Z"}
{"id": 537, "parent_run_id": "e37fc0051818372a", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2466, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-05T05:02:12Z"}
{"id": 538, "parent_run_id": "e37fc0051818372a", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1696, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-05T05:02:14Z"}
{"id": 539, "parent_run_id": "ec6c90078b2f3603", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 784, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-05T05:02:15Z"}
{"id": 540, "parent_run_id": "f4724e7e2ae04f75", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 738, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-05T05:02:15Z"}
{"id": 541, "parent_run_id": "6b8f336c753b21be", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 907, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:16Z"}
{"id": 542, "parent_run_id": "d6e4d23223bfa930", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 991, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-05T05:02:17Z"}
{"id": 543, "parent_run_id": "d6e4d23223bfa930", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 815, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-05T05:02:18Z"}
{"id": 544, "parent_run_id": "d6e4d23223bfa930", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 646, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-05T05:02:19Z"}
{"id": 545, "parent_run_id": "77a63bbcffa6fed4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 646, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-05T05:02:19Z"}
{"id": 546, "parent_run_id": "77a63bbcffa6fed4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 903, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-05T05:02:20Z"}
{"id": 547, "parent_run_id": "77a63bbcffa6fed4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 779, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-05T05:02:21Z"}
{"id": 548, "parent_run_id": "adf1b5ac8753f176", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 634, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-05T05:02:22Z"}
{"id": 549, "parent_run_id": "adf1b5ac8753f176", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 564, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-05T05:02:22Z"}
{"id": 550, "parent_run_id": "adf1b5ac8753f176", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 444, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-05T05:02:23Z"}
{"id": 551, "parent_run_id": "986a4e4bb4286ade", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 870, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-05T05:02:24Z"}
{"id": 552, "parent_run_id": "986a4e4bb4286ade", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 589, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-05T05:02:24Z"}
{"id": 553, "parent_run_id": "986a4e4bb4286ade", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 794, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-05T05:02:25Z"}
{"id": 554, "parent_run_id": "3bf275f5634283d3", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 735, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-05T05:02:26Z"}
{"id": 555, "parent_run_id": "3bf275f5634283d3", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 672, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-05T05:02:26Z"}
{"id": 556, "parent_run_id": "3bf275f5634283d3", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 578, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-05T05:02:27Z"}
{"id": 557, "parent_run_id": "4dee8a74deab21ca", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 691, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-05T05:02:28Z"}
{"id": 558, "parent_run_id": "4dee8a74deab21ca", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 809, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-05T05:02:28Z"}
{"id": 559, "parent_run_id": "4dee8a74deab21ca", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 836, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-05T05:02:29Z"}
{"id": 560, "parent_run_id": "aae94a15127df223", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 516, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:30Z"}
{"id": 561, "parent_run_id": "aae94a15127df223", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1312, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:31Z"}
{"id": 562, "parent_run_id": "aae94a15127df223", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1929, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:33Z"}
{"id": 563, "parent_run_id": "17ca23de2a2e66f8", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 655, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:34Z"}
{"id": 564, "parent_run_id": "17ca23de2a2e66f8", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1141, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:35Z"}
{"id": 565, "parent_run_id": "17ca23de2a2e66f8", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 470, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:35Z"}
{"id": 566, "parent_run_id": "b21a27608805ecdc", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 753, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-05T05:02:36Z"}
{"id": 567, "parent_run_id": "b21a27608805ecdc", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 3276, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-05T05:02:39Z"}
{"id": 568, "parent_run_id": "b21a27608805ecdc", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1022, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-05T05:02:40Z"}
{"id": 569, "parent_run_id": "cd1f33b4f7ec411f", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 775, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:41Z"}
{"id": 570, "parent_run_id": "cd1f33b4f7ec411f", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 882, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:42Z"}
{"id": 571, "parent_run_id": "cd1f33b4f7ec411f", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 529, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:43Z"}
{"id": 572, "parent_run_id": "0a8d88c66cd3b914", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 541, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:43Z"}
{"id": 573, "parent_run_id": "0a8d88c66cd3b914", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1460, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-05T05:02:45Z"}
{"id": 574, "parent_run_id": "0a8d88c66cd3b914", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 608, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-05T05:02:45Z"}
{"id": 575, "parent_run_id": "c024123b2fda33b4", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 516, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-05T05:02:46Z"}
{"id": 576, "parent_run_id": "c024123b2fda33b4", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2402, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-05T05:02:48Z"}
{"id": 577, "parent_run_id": "c024123b2fda33b4", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 568, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-05T05:02:49Z"}
{"id": 578, "parent_run_id": "2c81aec67081b8a1", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1257, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-05T05:02:50Z"}
{"id": 579, "parent_run_id": "bbb6a75166d6fb2b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 705, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-05T05:02:51Z"}
{"id": 580, "parent_run_id": "d3a9a87a6eafd907", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 724, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:52Z"}
{"id": 581, "parent_run_id": "523538da10626f3b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 772, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-05T05:02:52Z"}
{"id": 582, "parent_run_id": "28e3d58e6d2c22f7", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 823, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-05T05:02:53Z"}
{"id": 583, "parent_run_id": "d0e33be5e0233dcb", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 741, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-05T05:02:54Z"}
{"id": 596, "parent_run_id": "656f848f7802fdcc", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1293, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:03:59Z"}
{"id": 597, "parent_run_id": "656f848f7802fdcc", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1352, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:01Z"}
{"id": 598, "parent_run_id": "656f848f7802fdcc", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1673, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:02Z"}
{"id": 599, "parent_run_id": "e064533a105bcc73", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 852, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:03Z"}
{"id": 600, "parent_run_id": "e064533a105bcc73", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1124, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:04Z"}
{"id": 601, "parent_run_id": "e064533a105bcc73", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 930, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:05Z"}
{"id": 602, "parent_run_id": "a330df5f5097082e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 642, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-06T05:04:06Z"}
{"id": 603, "parent_run_id": "a330df5f5097082e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1609, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-06T05:04:08Z"}
{"id": 604, "parent_run_id": "a330df5f5097082e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 379, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-06T05:04:08Z"}
{"id": 605, "parent_run_id": "6872ba4f6841ad9c", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 775, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-06T05:04:09Z"}
{"id": 606, "parent_run_id": "f87e7550aeed06b7", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 826, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-06T05:04:10Z"}
{"id": 607, "parent_run_id": "dba76ef852eab36b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1665, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:11Z"}
{"id": 608, "parent_run_id": "5547b2970c69aa03", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 662, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-06T05:04:12Z"}
{"id": 609, "parent_run_id": "5547b2970c69aa03", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 801, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-06T05:04:13Z"}
{"id": 610, "parent_run_id": "5547b2970c69aa03", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 750, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-06T05:04:14Z"}
{"id": 611, "parent_run_id": "402407843237acb5", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 638, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-06T05:04:14Z"}
{"id": 612, "parent_run_id": "402407843237acb5", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 622, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-06T05:04:15Z"}
{"id": 613, "parent_run_id": "402407843237acb5", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 401, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-06T05:04:15Z"}
{"id": 614, "parent_run_id": "97c0b9a19403d4a3", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 611, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-06T05:04:16Z"}
{"id": 615, "parent_run_id": "97c0b9a19403d4a3", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 701, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-06T05:04:17Z"}
{"id": 616, "parent_run_id": "97c0b9a19403d4a3", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 384, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-06T05:04:17Z"}
{"id": 617, "parent_run_id": "230ff5967f9e40bc", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 623, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-06T05:04:18Z"}
{"id": 618, "parent_run_id": "230ff5967f9e40bc", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 767, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-06T05:04:18Z"}
{"id": 619, "parent_run_id": "230ff5967f9e40bc", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 448, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-06T05:04:19Z"}
{"id": 620, "parent_run_id": "144ff3de8c2f0e19", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 929, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-06T05:04:20Z"}
{"id": 621, "parent_run_id": "144ff3de8c2f0e19", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 564, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-06T05:04:20Z"}
{"id": 622, "parent_run_id": "144ff3de8c2f0e19", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 386, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-06T05:04:21Z"}
{"id": 623, "parent_run_id": "7d527d2453f0f8bb", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 894, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-06T05:04:22Z"}
{"id": 624, "parent_run_id": "7d527d2453f0f8bb", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 655, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-06T05:04:22Z"}
{"id": 625, "parent_run_id": "7d527d2453f0f8bb", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 771, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-06T05:04:23Z"}
{"id": 626, "parent_run_id": "fc673e6c4ee2c8e1", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 635, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:24Z"}
{"id": 627, "parent_run_id": "fc673e6c4ee2c8e1", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1086, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:25Z"}
{"id": 628, "parent_run_id": "fc673e6c4ee2c8e1", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 422, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:25Z"}
{"id": 629, "parent_run_id": "af3aa7a225f36e8e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 830, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:26Z"}
{"id": 630, "parent_run_id": "af3aa7a225f36e8e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1103, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:27Z"}
{"id": 631, "parent_run_id": "af3aa7a225f36e8e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 455, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:28Z"}
{"id": 632, "parent_run_id": "dac1e16b0b7f6add", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 789, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-06T05:04:28Z"}
{"id": 633, "parent_run_id": "dac1e16b0b7f6add", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2228, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-06T05:04:31Z"}
{"id": 634, "parent_run_id": "dac1e16b0b7f6add", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 399, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-06T05:04:31Z"}
{"id": 635, "parent_run_id": "7a130e52a8d1101d", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 638, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:32Z"}
{"id": 636, "parent_run_id": "7a130e52a8d1101d", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 889, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:33Z"}
{"id": 637, "parent_run_id": "7a130e52a8d1101d", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 502, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:33Z"}
{"id": 638, "parent_run_id": "6a7d16a84ce48fa7", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 613, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:34Z"}
{"id": 639, "parent_run_id": "6a7d16a84ce48fa7", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1933, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-06T05:04:36Z"}
{"id": 640, "parent_run_id": "6a7d16a84ce48fa7", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1806, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-06T05:04:37Z"}
{"id": 641, "parent_run_id": "bc8aef7ea797e824", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 639, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-06T05:04:38Z"}
{"id": 642, "parent_run_id": "bc8aef7ea797e824", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2153, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-06T05:04:40Z"}
{"id": 643, "parent_run_id": "bc8aef7ea797e824", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 785, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-06T05:04:41Z"}
{"id": 644, "parent_run_id": "5ec8ef75570d2948", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 841, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-06T05:04:42Z"}
{"id": 645, "parent_run_id": "df0218f7349a6dd7", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 819, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-06T05:04:43Z"}
{"id": 646, "parent_run_id": "c465b919b3e345e5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 663, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:43Z"}
{"id": 647, "parent_run_id": "e1367e4bebbe2685", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 760, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-06T05:04:44Z"}
{"id": 648, "parent_run_id": "d0443754612aa1fd", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 977, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-06T05:04:45Z"}
{"id": 649, "parent_run_id": "5d4683fc121d2f92", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 833, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-06T05:04:46Z"}
{"id": 653, "parent_run_id": "b23fb6ea5ef5bf42", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1488, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:04:26Z"}
{"id": 654, "parent_run_id": "b23fb6ea5ef5bf42", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 632, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:04:27Z"}
{"id": 655, "parent_run_id": "b23fb6ea5ef5bf42", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1834, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:04:28Z"}
{"id": 656, "parent_run_id": "7d7053fff66c0ecf", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 776, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:04:29Z"}
{"id": 657, "parent_run_id": "7d7053fff66c0ecf", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1091, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:04:30Z"}
{"id": 658, "parent_run_id": "7d7053fff66c0ecf", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 571, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:04:31Z"}
{"id": 659, "parent_run_id": "cccf378c12505681", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 661, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-07T05:04:32Z"}
{"id": 660, "parent_run_id": "cccf378c12505681", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2483, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-07T05:04:34Z"}
{"id": 661, "parent_run_id": "cccf378c12505681", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 473, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-07T05:04:35Z"}
{"id": 662, "parent_run_id": "37ee1d4beb6cbe42", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 835, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-07T05:04:35Z"}
{"id": 663, "parent_run_id": "10aaf4320b90d09b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 681, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-07T05:04:36Z"}
{"id": 664, "parent_run_id": "ab53bc9b50b3eeee", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 701, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:04:37Z"}
{"id": 665, "parent_run_id": "c66ef0e298205d03", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 660, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-07T05:04:37Z"}
{"id": 666, "parent_run_id": "c66ef0e298205d03", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1055, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-07T05:04:38Z"}
{"id": 667, "parent_run_id": "c66ef0e298205d03", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 457, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-07T05:04:39Z"}
{"id": 668, "parent_run_id": "ce750f977a0b1e87", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 839, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-07T05:04:40Z"}
{"id": 669, "parent_run_id": "ce750f977a0b1e87", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 888, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-07T05:04:41Z"}
{"id": 670, "parent_run_id": "ce750f977a0b1e87", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 864, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-07T05:04:42Z"}
{"id": 671, "parent_run_id": "04476896abf2cbd3", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 683, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-07T05:04:42Z"}
{"id": 672, "parent_run_id": "04476896abf2cbd3", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 604, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-07T05:04:43Z"}
{"id": 673, "parent_run_id": "04476896abf2cbd3", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 757, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-07T05:04:44Z"}
{"id": 674, "parent_run_id": "0dbb9b94f19a3160", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 652, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-07T05:04:44Z"}
{"id": 675, "parent_run_id": "0dbb9b94f19a3160", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 638, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-07T05:04:45Z"}
{"id": 676, "parent_run_id": "0dbb9b94f19a3160", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 649, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-07T05:04:46Z"}
{"id": 677, "parent_run_id": "d63e5f3b03884c21", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1311, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-07T05:04:47Z"}
{"id": 678, "parent_run_id": "d63e5f3b03884c21", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 983, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-07T05:04:48Z"}
{"id": 679, "parent_run_id": "d63e5f3b03884c21", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 699, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-07T05:04:49Z"}
{"id": 680, "parent_run_id": "e28a7359484c5fea", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 674, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-07T05:04:49Z"}
{"id": 681, "parent_run_id": "e28a7359484c5fea", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 742, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-07T05:04:50Z"}
{"id": 682, "parent_run_id": "e28a7359484c5fea", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 808, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-07T05:04:51Z"}
{"id": 683, "parent_run_id": "4877dee45ff959e8", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 771, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:04:52Z"}
{"id": 684, "parent_run_id": "4877dee45ff959e8", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1571, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:04:53Z"}
{"id": 685, "parent_run_id": "4877dee45ff959e8", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 969, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:04:54Z"}
{"id": 686, "parent_run_id": "da768ced46a8ade6", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 669, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:04:55Z"}
{"id": 687, "parent_run_id": "da768ced46a8ade6", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1259, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:04:56Z"}
{"id": 688, "parent_run_id": "da768ced46a8ade6", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 526, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:04:57Z"}
{"id": 689, "parent_run_id": "59621747814f5902", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "positive", "expected": "neutral", "correct": 0, "latency_ms": 645, "input_tokens": 9, "output_tokens": 2, "cost_eur": 4.75e-06, "error": null, "created_at": "2026-05-07T05:04:57Z"}
{"id": 690, "parent_run_id": "59621747814f5902", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2360, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-07T05:05:00Z"}
{"id": 691, "parent_run_id": "59621747814f5902", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 974, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-07T05:05:01Z"}
{"id": 692, "parent_run_id": "bfbced0c371d081e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 795, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:05:01Z"}
{"id": 693, "parent_run_id": "bfbced0c371d081e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 738, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:05:02Z"}
{"id": 694, "parent_run_id": "bfbced0c371d081e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 892, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:05:03Z"}
{"id": 695, "parent_run_id": "aec50dc82dcb2ff2", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 772, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:05:04Z"}
{"id": 696, "parent_run_id": "aec50dc82dcb2ff2", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1943, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-07T05:05:06Z"}
{"id": 697, "parent_run_id": "aec50dc82dcb2ff2", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 687, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-07T05:05:07Z"}
{"id": 698, "parent_run_id": "6e1ce94881136be3", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 879, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-07T05:05:07Z"}
{"id": 699, "parent_run_id": "6e1ce94881136be3", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2175, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-07T05:05:10Z"}
{"id": 700, "parent_run_id": "6e1ce94881136be3", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 608, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-07T05:05:10Z"}
{"id": 701, "parent_run_id": "1b981dce399857d3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 795, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-07T05:05:11Z"}
{"id": 702, "parent_run_id": "4089bf3c0f979bcc", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 698, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-07T05:05:12Z"}
{"id": 703, "parent_run_id": "06783117002f643c", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 714, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:05:12Z"}
{"id": 704, "parent_run_id": "8b9f0fd9b41eaf5b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 729, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-07T05:05:13Z"}
{"id": 705, "parent_run_id": "64672631f9118eaa", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 717, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-07T05:05:14Z"}
{"id": 706, "parent_run_id": "b0f65a11a8d36581", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 711, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-07T05:05:15Z"}
{"id": 708, "parent_run_id": "c2ccddd55d8869af", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1541, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:18Z"}
{"id": 709, "parent_run_id": "c2ccddd55d8869af", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 868, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:00:19Z"}
{"id": 710, "parent_run_id": "c2ccddd55d8869af", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 3660, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:00:22Z"}
{"id": 711, "parent_run_id": "c17c0c9b2622b3c9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 676, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:23Z"}
{"id": 712, "parent_run_id": "c17c0c9b2622b3c9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 905, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:00:24Z"}
{"id": 713, "parent_run_id": "c17c0c9b2622b3c9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 566, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:00:25Z"}
{"id": 714, "parent_run_id": "06420d6e72ec12ec", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 606, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-08T05:00:25Z"}
{"id": 715, "parent_run_id": "06420d6e72ec12ec", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2209, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-08T05:00:27Z"}
{"id": 716, "parent_run_id": "06420d6e72ec12ec", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1343, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-08T05:00:29Z"}
{"id": 717, "parent_run_id": "b65476cc9aea3028", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 763, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-08T05:00:30Z"}
{"id": 718, "parent_run_id": "046240bff7e3045d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 690, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-08T05:00:30Z"}
{"id": 719, "parent_run_id": "693beb7f2a21a9db", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 613, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:31Z"}
{"id": 720, "parent_run_id": "ac262ba2a0c0dde0", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 646, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-08T05:00:32Z"}
{"id": 721, "parent_run_id": "ac262ba2a0c0dde0", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 889, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-08T05:00:32Z"}
{"id": 722, "parent_run_id": "ac262ba2a0c0dde0", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1066, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-08T05:00:33Z"}
{"id": 723, "parent_run_id": "bd2ef639e253c4d7", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 594, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-08T05:00:34Z"}
{"id": 724, "parent_run_id": "bd2ef639e253c4d7", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1110, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-08T05:00:35Z"}
{"id": 725, "parent_run_id": "bd2ef639e253c4d7", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 523, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-08T05:00:36Z"}
{"id": 726, "parent_run_id": "ed7f83fb06722847", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 598, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-08T05:00:36Z"}
{"id": 727, "parent_run_id": "ed7f83fb06722847", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 965, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-08T05:00:37Z"}
{"id": 728, "parent_run_id": "ed7f83fb06722847", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 2049, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-08T05:00:39Z"}
{"id": 729, "parent_run_id": "9b96a189cccfde73", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 788, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-08T05:00:40Z"}
{"id": 730, "parent_run_id": "9b96a189cccfde73", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 742, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-08T05:00:41Z"}
{"id": 731, "parent_run_id": "9b96a189cccfde73", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 790, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-08T05:00:42Z"}
{"id": 732, "parent_run_id": "c65c10c1a24dfff9", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 624, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-08T05:00:42Z"}
{"id": 733, "parent_run_id": "c65c10c1a24dfff9", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 2057, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-08T05:00:44Z"}
{"id": 734, "parent_run_id": "c65c10c1a24dfff9", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1063, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-08T05:00:45Z"}
{"id": 735, "parent_run_id": "7c8d859bec878e06", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 623, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-08T05:00:46Z"}
{"id": 736, "parent_run_id": "7c8d859bec878e06", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 927, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-08T05:00:47Z"}
{"id": 737, "parent_run_id": "7c8d859bec878e06", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 711, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-08T05:00:48Z"}
{"id": 738, "parent_run_id": "c4ad8e2583fea550", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 778, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:49Z"}
{"id": 739, "parent_run_id": "c4ad8e2583fea550", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1113, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:00:50Z"}
{"id": 740, "parent_run_id": "c4ad8e2583fea550", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 2043, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:00:52Z"}
{"id": 741, "parent_run_id": "9d33be8d5591bd25", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 649, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:52Z"}
{"id": 742, "parent_run_id": "9d33be8d5591bd25", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 872, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:00:53Z"}
{"id": 743, "parent_run_id": "9d33be8d5591bd25", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1044, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:00:54Z"}
{"id": 744, "parent_run_id": "4782c16287865e37", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 668, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-08T05:00:55Z"}
{"id": 745, "parent_run_id": "4782c16287865e37", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2262, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-08T05:00:57Z"}
{"id": 746, "parent_run_id": "4782c16287865e37", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 945, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-08T05:00:58Z"}
{"id": 747, "parent_run_id": "5d08f0d769b04ee8", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 612, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:00:59Z"}
{"id": 748, "parent_run_id": "5d08f0d769b04ee8", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1270, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:01:00Z"}
{"id": 749, "parent_run_id": "5d08f0d769b04ee8", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1396, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:01:01Z"}
{"id": 750, "parent_run_id": "cf2d6994dcb90c0f", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 617, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:01:02Z"}
{"id": 751, "parent_run_id": "cf2d6994dcb90c0f", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1003, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-08T05:01:03Z"}
{"id": 752, "parent_run_id": "cf2d6994dcb90c0f", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 844, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-08T05:01:04Z"}
{"id": 753, "parent_run_id": "e3e77e1578545682", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 615, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-08T05:01:05Z"}
{"id": 754, "parent_run_id": "e3e77e1578545682", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2122, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-08T05:01:07Z"}
{"id": 755, "parent_run_id": "e3e77e1578545682", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 522, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-08T05:01:07Z"}
{"id": 756, "parent_run_id": "375bfc0eefde874e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 722, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-08T05:01:08Z"}
{"id": 757, "parent_run_id": "762038fcff7a56b7", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 675, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-08T05:01:09Z"}
{"id": 758, "parent_run_id": "8c960c99042e947d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 636, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:01:09Z"}
{"id": 759, "parent_run_id": "cb3eb7fdf4a43f71", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1341, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-08T05:01:11Z"}
{"id": 760, "parent_run_id": "fa11fd352f754c1a", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 786, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-08T05:01:11Z"}
{"id": 761, "parent_run_id": "f6d45c002eef9ae0", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 659, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-08T05:01:12Z"}
{"id": 763, "parent_run_id": "aafab3c42313ff19", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1670, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:17Z"}
{"id": 764, "parent_run_id": "aafab3c42313ff19", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1173, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:18Z"}
{"id": 765, "parent_run_id": "aafab3c42313ff19", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 778, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:19Z"}
{"id": 766, "parent_run_id": "64a0aa0158eb6527", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 798, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:20Z"}
{"id": 767, "parent_run_id": "64a0aa0158eb6527", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1271, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:21Z"}
{"id": 768, "parent_run_id": "64a0aa0158eb6527", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 2018, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:23Z"}
{"id": 769, "parent_run_id": "c52aac67ea9920b1", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1298, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-09T05:03:24Z"}
{"id": 770, "parent_run_id": "c52aac67ea9920b1", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2292, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-09T05:03:27Z"}
{"id": 771, "parent_run_id": "c52aac67ea9920b1", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 914, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-09T05:03:28Z"}
{"id": 772, "parent_run_id": "9e4ed8b730537870", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1278, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-09T05:03:29Z"}
{"id": 773, "parent_run_id": "78512cd3997159ad", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1586, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-09T05:03:30Z"}
{"id": 774, "parent_run_id": "96d7344b15892b2d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 663, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:31Z"}
{"id": 775, "parent_run_id": "4686e1f1de62e44f", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 686, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-09T05:03:32Z"}
{"id": 776, "parent_run_id": "4686e1f1de62e44f", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 717, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-09T05:03:33Z"}
{"id": 777, "parent_run_id": "4686e1f1de62e44f", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 736, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-09T05:03:33Z"}
{"id": 778, "parent_run_id": "0749e122b44b451c", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 785, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-09T05:03:34Z"}
{"id": 779, "parent_run_id": "0749e122b44b451c", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 666, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-09T05:03:35Z"}
{"id": 780, "parent_run_id": "0749e122b44b451c", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1793, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-09T05:03:37Z"}
{"id": 781, "parent_run_id": "07c0a3bb57867582", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 680, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-09T05:03:37Z"}
{"id": 782, "parent_run_id": "07c0a3bb57867582", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 578, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-09T05:03:38Z"}
{"id": 783, "parent_run_id": "07c0a3bb57867582", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 555, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-09T05:03:38Z"}
{"id": 784, "parent_run_id": "de371a21f9818771", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 652, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-09T05:03:39Z"}
{"id": 785, "parent_run_id": "de371a21f9818771", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 721, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-09T05:03:40Z"}
{"id": 786, "parent_run_id": "de371a21f9818771", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 722, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-09T05:03:40Z"}
{"id": 787, "parent_run_id": "0dd6fae03dd5a412", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1102, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-09T05:03:42Z"}
{"id": 788, "parent_run_id": "0dd6fae03dd5a412", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 720, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-09T05:03:42Z"}
{"id": 789, "parent_run_id": "0dd6fae03dd5a412", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 532, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-09T05:03:43Z"}
{"id": 790, "parent_run_id": "9271d0ed4dd064f7", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1036, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-09T05:03:44Z"}
{"id": 791, "parent_run_id": "9271d0ed4dd064f7", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 711, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-09T05:03:45Z"}
{"id": 792, "parent_run_id": "9271d0ed4dd064f7", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 946, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-09T05:03:46Z"}
{"id": 793, "parent_run_id": "a2ce02a02ca34a17", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 923, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:46Z"}
{"id": 794, "parent_run_id": "a2ce02a02ca34a17", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1430, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:48Z"}
{"id": 795, "parent_run_id": "a2ce02a02ca34a17", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 480, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:48Z"}
{"id": 796, "parent_run_id": "9f585d6ffae97b78", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 827, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:49Z"}
{"id": 797, "parent_run_id": "9f585d6ffae97b78", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1279, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:51Z"}
{"id": 798, "parent_run_id": "9f585d6ffae97b78", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 557, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:51Z"}
{"id": 799, "parent_run_id": "d332f066444833db", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 606, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-09T05:03:52Z"}
{"id": 800, "parent_run_id": "d332f066444833db", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2079, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-09T05:03:54Z"}
{"id": 801, "parent_run_id": "d332f066444833db", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 847, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-09T05:03:55Z"}
{"id": 802, "parent_run_id": "679dba45daa8c116", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 888, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:56Z"}
{"id": 803, "parent_run_id": "679dba45daa8c116", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 622, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:56Z"}
{"id": 804, "parent_run_id": "679dba45daa8c116", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 487, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:57Z"}
{"id": 805, "parent_run_id": "75f29641a4261600", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 709, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:03:57Z"}
{"id": 806, "parent_run_id": "75f29641a4261600", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1334, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-09T05:03:59Z"}
{"id": 807, "parent_run_id": "75f29641a4261600", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 570, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-09T05:03:59Z"}
{"id": 808, "parent_run_id": "3adef3a855801596", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 732, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-09T05:04:00Z"}
{"id": 809, "parent_run_id": "3adef3a855801596", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 3112, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-09T05:04:03Z"}
{"id": 810, "parent_run_id": "3adef3a855801596", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 599, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-09T05:04:04Z"}
{"id": 811, "parent_run_id": "d9907e7bed558478", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 716, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-09T05:04:04Z"}
{"id": 812, "parent_run_id": "cc1b32f177cb2213", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 694, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-09T05:04:05Z"}
{"id": 813, "parent_run_id": "82ee0107488c9a9f", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 920, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:04:06Z"}
{"id": 814, "parent_run_id": "c997aeeca36bd566", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 784, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-09T05:04:07Z"}
{"id": 815, "parent_run_id": "8b6d8d889e17558e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 784, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-09T05:04:08Z"}
{"id": 816, "parent_run_id": "c3edffeb9e571994", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 740, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-09T05:04:08Z"}
{"id": 818, "parent_run_id": "6a914f9d8cca88e6", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1369, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:01Z"}
{"id": 819, "parent_run_id": "6a914f9d8cca88e6", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 758, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:02Z"}
{"id": 820, "parent_run_id": "6a914f9d8cca88e6", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1006, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:03Z"}
{"id": 821, "parent_run_id": "a352c75767bc39cb", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1305, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:04Z"}
{"id": 822, "parent_run_id": "a352c75767bc39cb", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 643, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:05Z"}
{"id": 823, "parent_run_id": "a352c75767bc39cb", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 420, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:05Z"}
{"id": 824, "parent_run_id": "59b0be8c21d919d0", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 703, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-10T05:03:06Z"}
{"id": 825, "parent_run_id": "59b0be8c21d919d0", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2294, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-10T05:03:08Z"}
{"id": 826, "parent_run_id": "59b0be8c21d919d0", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2687, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-10T05:03:11Z"}
{"id": 827, "parent_run_id": "69c54d6216ef4f4d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 747, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-10T05:03:11Z"}
{"id": 828, "parent_run_id": "77c723c96163d2c3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 654, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-10T05:03:12Z"}
{"id": 829, "parent_run_id": "7dc85c8f173fb5bc", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 750, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:13Z"}
{"id": 830, "parent_run_id": "bab84406919424ee", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 657, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-10T05:03:13Z"}
{"id": 831, "parent_run_id": "bab84406919424ee", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 557, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-10T05:03:14Z"}
{"id": 832, "parent_run_id": "bab84406919424ee", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1187, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-10T05:03:15Z"}
{"id": 833, "parent_run_id": "b8204a65909500cd", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 611, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-10T05:03:16Z"}
{"id": 834, "parent_run_id": "b8204a65909500cd", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 662, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-10T05:03:17Z"}
{"id": 835, "parent_run_id": "b8204a65909500cd", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 605, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-10T05:03:17Z"}
{"id": 836, "parent_run_id": "6527c6c7ebd1dccf", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 610, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-10T05:03:18Z"}
{"id": 837, "parent_run_id": "6527c6c7ebd1dccf", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1470, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-10T05:03:19Z"}
{"id": 838, "parent_run_id": "6527c6c7ebd1dccf", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 880, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-10T05:03:20Z"}
{"id": 839, "parent_run_id": "748f34e901ae4e42", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 595, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-10T05:03:21Z"}
{"id": 840, "parent_run_id": "748f34e901ae4e42", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 530, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-10T05:03:21Z"}
{"id": 841, "parent_run_id": "748f34e901ae4e42", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 797, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-10T05:03:22Z"}
{"id": 842, "parent_run_id": "b1ced658b3ae8b45", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1268, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-10T05:03:23Z"}
{"id": 843, "parent_run_id": "b1ced658b3ae8b45", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 616, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-10T05:03:24Z"}
{"id": 844, "parent_run_id": "b1ced658b3ae8b45", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 866, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-10T05:03:25Z"}
{"id": 845, "parent_run_id": "8ad5bd4453b3439b", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 634, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-10T05:03:25Z"}
{"id": 846, "parent_run_id": "8ad5bd4453b3439b", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1960, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-10T05:03:27Z"}
{"id": 847, "parent_run_id": "8ad5bd4453b3439b", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 399, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-10T05:03:28Z"}
{"id": 848, "parent_run_id": "1a1cb93efc3c6727", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 658, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:28Z"}
{"id": 849, "parent_run_id": "1a1cb93efc3c6727", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1068, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:30Z"}
{"id": 850, "parent_run_id": "1a1cb93efc3c6727", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 605, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:30Z"}
{"id": 851, "parent_run_id": "9611c8f8b823d318", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 630, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:31Z"}
{"id": 852, "parent_run_id": "9611c8f8b823d318", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 648, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:31Z"}
{"id": 853, "parent_run_id": "9611c8f8b823d318", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 498, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:32Z"}
{"id": 854, "parent_run_id": "a60619d58120c816", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 611, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-10T05:03:33Z"}
{"id": 855, "parent_run_id": "a60619d58120c816", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2218, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-10T05:03:35Z"}
{"id": 856, "parent_run_id": "a60619d58120c816", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1332, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-10T05:03:36Z"}
{"id": 857, "parent_run_id": "4a8d4996d6c0cff0", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 768, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:37Z"}
{"id": 858, "parent_run_id": "4a8d4996d6c0cff0", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1062, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:38Z"}
{"id": 859, "parent_run_id": "4a8d4996d6c0cff0", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1082, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:39Z"}
{"id": 860, "parent_run_id": "fbfde6b8b396f919", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 739, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:40Z"}
{"id": 861, "parent_run_id": "fbfde6b8b396f919", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1067, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-10T05:03:41Z"}
{"id": 862, "parent_run_id": "fbfde6b8b396f919", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 568, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-10T05:03:41Z"}
{"id": 863, "parent_run_id": "ff6b74d6dbaeb2ca", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 608, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-10T05:03:42Z"}
{"id": 864, "parent_run_id": "ff6b74d6dbaeb2ca", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2202, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-10T05:03:44Z"}
{"id": 865, "parent_run_id": "ff6b74d6dbaeb2ca", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1261, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-10T05:03:46Z"}
{"id": 866, "parent_run_id": "099e67b1e4d567d6", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 781, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-10T05:03:46Z"}
{"id": 867, "parent_run_id": "c6b2d0480f4555ac", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 2604, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-10T05:03:49Z"}
{"id": 868, "parent_run_id": "58bebf714fc488a8", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1238, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:50Z"}
{"id": 869, "parent_run_id": "a227e0ac170f6c2f", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 714, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-10T05:03:51Z"}
{"id": 870, "parent_run_id": "669f6e3d58bfd019", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 690, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-10T05:03:52Z"}
{"id": 871, "parent_run_id": "8880360844921eda", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1147, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-10T05:03:53Z"}
{"id": 878, "parent_run_id": "8feee85ac427c5f3", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 2035, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:02:43Z"}
{"id": 879, "parent_run_id": "8feee85ac427c5f3", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 939, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:02:44Z"}
{"id": 880, "parent_run_id": "8feee85ac427c5f3", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1154, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:02:45Z"}
{"id": 881, "parent_run_id": "ff59938cbe27aead", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 859, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:02:46Z"}
{"id": 882, "parent_run_id": "ff59938cbe27aead", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1199, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:02:47Z"}
{"id": 883, "parent_run_id": "ff59938cbe27aead", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 830, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:02:48Z"}
{"id": 884, "parent_run_id": "7f8e99a52556948e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 752, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-11T05:02:48Z"}
{"id": 885, "parent_run_id": "7f8e99a52556948e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2664, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-11T05:02:51Z"}
{"id": 886, "parent_run_id": "7f8e99a52556948e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2126, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-11T05:02:53Z"}
{"id": 887, "parent_run_id": "80c37939ba9c927a", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 905, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-11T05:02:54Z"}
{"id": 888, "parent_run_id": "4bfe240f29d1e486", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 914, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-11T05:02:55Z"}
{"id": 889, "parent_run_id": "e38d0949cccfe3b0", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 668, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:02:56Z"}
{"id": 890, "parent_run_id": "406f210794807560", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 732, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-11T05:02:57Z"}
{"id": 891, "parent_run_id": "406f210794807560", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 634, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-11T05:02:57Z"}
{"id": 892, "parent_run_id": "406f210794807560", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1074, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-11T05:02:58Z"}
{"id": 893, "parent_run_id": "520dd61766d2b7e9", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 703, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-11T05:02:59Z"}
{"id": 894, "parent_run_id": "520dd61766d2b7e9", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 627, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-11T05:03:00Z"}
{"id": 895, "parent_run_id": "520dd61766d2b7e9", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1892, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-11T05:03:01Z"}
{"id": 896, "parent_run_id": "7bb5abe1bf1cd4b4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 869, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-11T05:03:02Z"}
{"id": 897, "parent_run_id": "7bb5abe1bf1cd4b4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 931, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-11T05:03:03Z"}
{"id": 898, "parent_run_id": "7bb5abe1bf1cd4b4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1214, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-11T05:03:05Z"}
{"id": 899, "parent_run_id": "e10de88337ff32e4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 606, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-11T05:03:05Z"}
{"id": 900, "parent_run_id": "e10de88337ff32e4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 577, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-11T05:03:06Z"}
{"id": 901, "parent_run_id": "e10de88337ff32e4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 743, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-11T05:03:06Z"}
{"id": 902, "parent_run_id": "12fe85eb1a201abc", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 685, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-11T05:03:07Z"}
{"id": 903, "parent_run_id": "12fe85eb1a201abc", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1108, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-11T05:03:08Z"}
{"id": 904, "parent_run_id": "12fe85eb1a201abc", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 959, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-11T05:03:09Z"}
{"id": 905, "parent_run_id": "c5934461e9839235", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 609, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-11T05:03:10Z"}
{"id": 906, "parent_run_id": "c5934461e9839235", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 709, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-11T05:03:11Z"}
{"id": 907, "parent_run_id": "c5934461e9839235", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 582, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-11T05:03:11Z"}
{"id": 908, "parent_run_id": "28e332c76a96e823", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 649, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:12Z"}
{"id": 909, "parent_run_id": "28e332c76a96e823", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 661, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:03:12Z"}
{"id": 910, "parent_run_id": "28e332c76a96e823", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1017, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:03:13Z"}
{"id": 911, "parent_run_id": "019fa7e2e6d9de97", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 662, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:14Z"}
{"id": 912, "parent_run_id": "019fa7e2e6d9de97", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1062, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:03:15Z"}
{"id": 913, "parent_run_id": "019fa7e2e6d9de97", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 568, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:03:16Z"}
{"id": 914, "parent_run_id": "fbb460fed7ae46df", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 717, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-11T05:03:17Z"}
{"id": 915, "parent_run_id": "fbb460fed7ae46df", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2444, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-11T05:03:19Z"}
{"id": 916, "parent_run_id": "fbb460fed7ae46df", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 667, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-11T05:03:20Z"}
{"id": 917, "parent_run_id": "0cb34a080c965662", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 729, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:20Z"}
{"id": 918, "parent_run_id": "0cb34a080c965662", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 953, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:03:21Z"}
{"id": 919, "parent_run_id": "0cb34a080c965662", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 634, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:03:22Z"}
{"id": 920, "parent_run_id": "070967f1b41d3d07", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 932, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:23Z"}
{"id": 921, "parent_run_id": "070967f1b41d3d07", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1584, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-11T05:03:25Z"}
{"id": 922, "parent_run_id": "070967f1b41d3d07", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 934, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-11T05:03:25Z"}
{"id": 923, "parent_run_id": "ad84f606fe3068a5", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 613, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-11T05:03:26Z"}
{"id": 924, "parent_run_id": "ad84f606fe3068a5", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1862, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-11T05:03:28Z"}
{"id": 925, "parent_run_id": "ad84f606fe3068a5", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 932, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-11T05:03:29Z"}
{"id": 926, "parent_run_id": "73a2154faadc8ebd", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 723, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-11T05:03:30Z"}
{"id": 927, "parent_run_id": "64989df9c581c164", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1002, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-11T05:03:31Z"}
{"id": 928, "parent_run_id": "f26f3951f19c6737", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 789, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:31Z"}
{"id": 929, "parent_run_id": "d492223367c1de04", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 751, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-11T05:03:32Z"}
{"id": 930, "parent_run_id": "429a625ee51a8d7f", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1409, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-11T05:03:34Z"}
{"id": 931, "parent_run_id": "42664af6d5a29d00", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 628, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-11T05:03:34Z"}
{"id": 941, "parent_run_id": "f1c5eaec138f5f63", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1858, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T05:03:35Z"}
{"id": 942, "parent_run_id": "c10a6cff8eacf4b2", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1873, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T05:03:37Z"}
{"id": 943, "parent_run_id": "bbb439c9a0f0ac7c", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1596, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:03:39Z"}
{"id": 944, "parent_run_id": "e38650a335150868", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 724, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:03:40Z"}
{"id": 945, "parent_run_id": "e38650a335150868", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 695, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:03:40Z"}
{"id": 946, "parent_run_id": "e38650a335150868", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 2085, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:03:42Z"}
{"id": 947, "parent_run_id": "8d4c9bfd26faea37", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 744, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:03:43Z"}
{"id": 948, "parent_run_id": "8d4c9bfd26faea37", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1384, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:03:44Z"}
{"id": 949, "parent_run_id": "8d4c9bfd26faea37", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1723, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:03:46Z"}
{"id": 950, "parent_run_id": "b2186731c4a3a62a", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 954, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T05:03:47Z"}
{"id": 951, "parent_run_id": "b2186731c4a3a62a", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1660, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T05:03:49Z"}
{"id": 952, "parent_run_id": "b2186731c4a3a62a", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1217, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T05:03:50Z"}
{"id": 953, "parent_run_id": "da75badc48c004e9", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 721, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-12T05:03:51Z"}
{"id": 954, "parent_run_id": "da75badc48c004e9", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 884, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-12T05:03:52Z"}
{"id": 955, "parent_run_id": "da75badc48c004e9", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 2386, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-12T05:03:54Z"}
{"id": 956, "parent_run_id": "1fd06dd96d306f72", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 854, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-12T05:03:55Z"}
{"id": 957, "parent_run_id": "1fd06dd96d306f72", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 716, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-12T05:03:56Z"}
{"id": 958, "parent_run_id": "1fd06dd96d306f72", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 555, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-12T05:03:56Z"}
{"id": 959, "parent_run_id": "dd5d88077f31a9f9", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 841, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T05:03:57Z"}
{"id": 960, "parent_run_id": "dd5d88077f31a9f9", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 579, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T05:03:58Z"}
{"id": 961, "parent_run_id": "dd5d88077f31a9f9", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 580, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T05:03:58Z"}
{"id": 962, "parent_run_id": "c683449898a36f3d", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 828, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-12T05:03:59Z"}
{"id": 963, "parent_run_id": "c683449898a36f3d", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 900, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-12T05:04:00Z"}
{"id": 964, "parent_run_id": "c683449898a36f3d", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 807, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-12T05:04:01Z"}
{"id": 965, "parent_run_id": "800c0a18b6fce9c1", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1020, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-12T05:04:02Z"}
{"id": 966, "parent_run_id": "800c0a18b6fce9c1", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1122, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-12T05:04:03Z"}
{"id": 967, "parent_run_id": "800c0a18b6fce9c1", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 494, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-12T05:04:03Z"}
{"id": 968, "parent_run_id": "c724f0956ef91ad4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 675, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T05:04:04Z"}
{"id": 969, "parent_run_id": "c724f0956ef91ad4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 624, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T05:04:05Z"}
{"id": 970, "parent_run_id": "c724f0956ef91ad4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 596, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T05:04:05Z"}
{"id": 971, "parent_run_id": "8b162fcfb6ba89ac", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 867, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:06Z"}
{"id": 972, "parent_run_id": "8b162fcfb6ba89ac", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1069, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:04:07Z"}
{"id": 973, "parent_run_id": "8b162fcfb6ba89ac", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 623, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:04:08Z"}
{"id": 974, "parent_run_id": "40c48ca967600c93", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 857, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:09Z"}
{"id": 975, "parent_run_id": "40c48ca967600c93", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1300, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:04:10Z"}
{"id": 976, "parent_run_id": "40c48ca967600c93", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1053, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:04:11Z"}
{"id": 977, "parent_run_id": "a77130be7c3214c7", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 960, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T05:04:12Z"}
{"id": 978, "parent_run_id": "a77130be7c3214c7", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 2612, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-12T05:04:15Z"}
{"id": 979, "parent_run_id": "a77130be7c3214c7", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 814, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T05:04:16Z"}
{"id": 980, "parent_run_id": "7ec6ce9d1ea5cf71", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 909, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:17Z"}
{"id": 981, "parent_run_id": "7ec6ce9d1ea5cf71", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 605, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:04:17Z"}
{"id": 982, "parent_run_id": "7ec6ce9d1ea5cf71", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 582, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:04:18Z"}
{"id": 983, "parent_run_id": "9c340909114f2552", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 841, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:19Z"}
{"id": 984, "parent_run_id": "9c340909114f2552", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1358, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T05:04:20Z"}
{"id": 985, "parent_run_id": "9c340909114f2552", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 447, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T05:04:20Z"}
{"id": 986, "parent_run_id": "1f2f6e7813cc63ff", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 979, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T05:04:21Z"}
{"id": 987, "parent_run_id": "1f2f6e7813cc63ff", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 2767, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-12T05:04:24Z"}
{"id": 988, "parent_run_id": "1f2f6e7813cc63ff", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 5570, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T05:04:30Z"}
{"id": 989, "parent_run_id": "786ad912bebf4cab", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 889, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T05:04:31Z"}
{"id": 990, "parent_run_id": "4b9862e7881e41f4", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1499, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T05:04:32Z"}
{"id": 991, "parent_run_id": "11e6d4db0ca3dcc5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 956, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:33Z"}
{"id": 992, "parent_run_id": "21b5119c0f613ee9", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1050, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T05:04:34Z"}
{"id": 993, "parent_run_id": "ea0d2b7b34f5a530", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 788, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T05:04:35Z"}
{"id": 994, "parent_run_id": "3468bf08b8960ea2", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 873, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T05:04:36Z"}
{"id": 995, "parent_run_id": "608bc5b69b3912f5", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1552, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T13:35:41Z"}
{"id": 996, "parent_run_id": "8f77ce236c4a5b2d", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 939, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T13:35:42Z"}
{"id": 997, "parent_run_id": "02c19df7c1d3523b", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 724, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:35:42Z"}
{"id": 998, "parent_run_id": "29aa85cacd828fd9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 865, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:35:43Z"}
{"id": 999, "parent_run_id": "29aa85cacd828fd9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1232, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:35:44Z"}
{"id": 1000, "parent_run_id": "29aa85cacd828fd9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 2150, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:35:47Z"}
{"id": 1001, "parent_run_id": "9efd9824d03f7a9e", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 790, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:35:47Z"}
{"id": 1002, "parent_run_id": "9efd9824d03f7a9e", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1483, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:35:49Z"}
{"id": 1003, "parent_run_id": "9efd9824d03f7a9e", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1048, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:35:50Z"}
{"id": 1004, "parent_run_id": "bc6a70a2df7511aa", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1288, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T13:35:51Z"}
{"id": 1005, "parent_run_id": "bc6a70a2df7511aa", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2131, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T13:35:53Z"}
{"id": 1006, "parent_run_id": "bc6a70a2df7511aa", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2375, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T13:35:56Z"}
{"id": 1007, "parent_run_id": "3ca117c544ae3cdc", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1043, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-12T13:35:57Z"}
{"id": 1008, "parent_run_id": "3ca117c544ae3cdc", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 622, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-12T13:35:57Z"}
{"id": 1009, "parent_run_id": "3ca117c544ae3cdc", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1032, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-12T13:35:58Z"}
{"id": 1010, "parent_run_id": "b6593e371bbe612b", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 804, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-12T13:35:59Z"}
{"id": 1011, "parent_run_id": "b6593e371bbe612b", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 714, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-12T13:36:00Z"}
{"id": 1012, "parent_run_id": "b6593e371bbe612b", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 644, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-12T13:36:01Z"}
{"id": 1013, "parent_run_id": "bdda6da6bc5a12f4", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 838, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T13:36:01Z"}
{"id": 1014, "parent_run_id": "bdda6da6bc5a12f4", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 713, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T13:36:02Z"}
{"id": 1015, "parent_run_id": "bdda6da6bc5a12f4", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 1072, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T13:36:03Z"}
{"id": 1016, "parent_run_id": "d81b65a1ed20dd9c", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 882, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-12T13:36:04Z"}
{"id": 1017, "parent_run_id": "d81b65a1ed20dd9c", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 540, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-12T13:36:05Z"}
{"id": 1018, "parent_run_id": "d81b65a1ed20dd9c", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 883, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-12T13:36:06Z"}
{"id": 1019, "parent_run_id": "d709bd8ec8b2c4bd", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 913, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-12T13:36:06Z"}
{"id": 1020, "parent_run_id": "d709bd8ec8b2c4bd", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 752, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-12T13:36:07Z"}
{"id": 1021, "parent_run_id": "d709bd8ec8b2c4bd", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 598, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-12T13:36:08Z"}
{"id": 1022, "parent_run_id": "852317b59cc48997", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 682, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T13:36:08Z"}
{"id": 1023, "parent_run_id": "852317b59cc48997", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 740, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T13:36:09Z"}
{"id": 1024, "parent_run_id": "852317b59cc48997", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 784, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T13:36:10Z"}
{"id": 1025, "parent_run_id": "4031fceafb575913", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 813, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:11Z"}
{"id": 1026, "parent_run_id": "4031fceafb575913", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1422, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:36:12Z"}
{"id": 1027, "parent_run_id": "4031fceafb575913", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 610, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:36:13Z"}
{"id": 1028, "parent_run_id": "e45edaef19de21d9", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 2059, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:15Z"}
{"id": 1029, "parent_run_id": "e45edaef19de21d9", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1272, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:36:16Z"}
{"id": 1030, "parent_run_id": "e45edaef19de21d9", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 459, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:36:17Z"}
{"id": 1031, "parent_run_id": "74b8014aedb1546b", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1341, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T13:36:18Z"}
{"id": 1032, "parent_run_id": "74b8014aedb1546b", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2111, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T13:36:20Z"}
{"id": 1033, "parent_run_id": "74b8014aedb1546b", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1183, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T13:36:21Z"}
{"id": 1034, "parent_run_id": "69631b5ca0482dfd", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 847, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:22Z"}
{"id": 1035, "parent_run_id": "69631b5ca0482dfd", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 1678, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:36:24Z"}
{"id": 1036, "parent_run_id": "69631b5ca0482dfd", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 988, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:36:25Z"}
{"id": 1037, "parent_run_id": "dbc00df5af63ae9c", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 992, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:26Z"}
{"id": 1038, "parent_run_id": "dbc00df5af63ae9c", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1552, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-12T13:36:27Z"}
{"id": 1039, "parent_run_id": "dbc00df5af63ae9c", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 647, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-12T13:36:28Z"}
{"id": 1040, "parent_run_id": "3f0c4795e2af116d", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 868, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-12T13:36:29Z"}
{"id": 1041, "parent_run_id": "3f0c4795e2af116d", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1703, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-12T13:36:31Z"}
{"id": 1042, "parent_run_id": "3f0c4795e2af116d", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 843, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-12T13:36:32Z"}
{"id": 1043, "parent_run_id": "e75615bc9d618ce1", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1067, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T13:36:33Z"}
{"id": 1044, "parent_run_id": "725339ddd0d0b13e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1059, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T13:36:34Z"}
{"id": 1045, "parent_run_id": "dbcf26cee3f8816e", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 680, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:34Z"}
{"id": 1046, "parent_run_id": "c346752cf959c2b3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1033, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-12T13:36:35Z"}
{"id": 1047, "parent_run_id": "6ca8dbe3c9e43c54", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 907, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-12T13:36:36Z"}
{"id": 1048, "parent_run_id": "df3750fa69b23e61", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1961, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-12T13:36:38Z"}
{"id": 1051, "parent_run_id": "b312fcd301e93528", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 1369, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-13T05:03:36Z"}
{"id": 1052, "parent_run_id": "dc05ed43237325cf", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 1219, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-13T05:03:37Z"}
{"id": 1053, "parent_run_id": "00c796b9f393cbcd", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 611, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:03:38Z"}
{"id": 1054, "parent_run_id": "7549084aa7a1c856", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 810, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:03:38Z"}
{"id": 1055, "parent_run_id": "7549084aa7a1c856", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 677, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:03:39Z"}
{"id": 1056, "parent_run_id": "7549084aa7a1c856", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1745, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:03:41Z"}
{"id": 1057, "parent_run_id": "f26aa6829aff6bb1", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 679, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:03:41Z"}
{"id": 1058, "parent_run_id": "f26aa6829aff6bb1", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 783, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:03:42Z"}
{"id": 1059, "parent_run_id": "f26aa6829aff6bb1", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 2555, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:03:45Z"}
{"id": 1060, "parent_run_id": "fd1f97c9ab033e1a", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 1806, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-13T05:03:47Z"}
{"id": 1061, "parent_run_id": "fd1f97c9ab033e1a", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 3168, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-13T05:03:50Z"}
{"id": 1062, "parent_run_id": "fd1f97c9ab033e1a", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 1215, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-13T05:03:51Z"}
{"id": 1063, "parent_run_id": "25bd972743c7affc", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 1001, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-13T05:03:52Z"}
{"id": 1064, "parent_run_id": "25bd972743c7affc", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 650, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-13T05:03:53Z"}
{"id": 1065, "parent_run_id": "25bd972743c7affc", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 916, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-13T05:03:54Z"}
{"id": 1066, "parent_run_id": "a5fe9fd0cb14c248", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 1141, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-13T05:03:55Z"}
{"id": 1067, "parent_run_id": "a5fe9fd0cb14c248", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 595, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-13T05:03:55Z"}
{"id": 1068, "parent_run_id": "a5fe9fd0cb14c248", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 603, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-13T05:03:56Z"}
{"id": 1069, "parent_run_id": "eef055f8c0385523", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 792, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-13T05:03:57Z"}
{"id": 1070, "parent_run_id": "eef055f8c0385523", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 779, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-13T05:03:58Z"}
{"id": 1071, "parent_run_id": "eef055f8c0385523", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 658, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-13T05:03:58Z"}
{"id": 1072, "parent_run_id": "dbc640de0367d75c", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 888, "input_tokens": 10, "output_tokens": 1, "cost_eur": 3.75e-06, "error": null, "created_at": "2026-05-13T05:03:59Z"}
{"id": 1073, "parent_run_id": "dbc640de0367d75c", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 616, "input_tokens": 10, "output_tokens": 1, "cost_eur": 1.0500000000000001e-06, "error": null, "created_at": "2026-05-13T05:04:00Z"}
{"id": 1074, "parent_run_id": "dbc640de0367d75c", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]", "output_text": "en", "expected": "en", "correct": 1, "latency_ms": 920, "input_tokens": 10, "output_tokens": 1, "cost_eur": 2.1000000000000002e-06, "error": null, "created_at": "2026-05-13T05:04:01Z"}
{"id": 1075, "parent_run_id": "72d93e466fb43b14", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 717, "input_tokens": 11, "output_tokens": 1, "cost_eur": 4e-06, "error": null, "created_at": "2026-05-13T05:04:01Z"}
{"id": 1076, "parent_run_id": "72d93e466fb43b14", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 995, "input_tokens": 11, "output_tokens": 1, "cost_eur": 1.125e-06, "error": null, "created_at": "2026-05-13T05:04:02Z"}
{"id": 1077, "parent_run_id": "72d93e466fb43b14", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]", "output_text": "fr", "expected": "fr", "correct": 1, "latency_ms": 799, "input_tokens": 11, "output_tokens": 1, "cost_eur": 2.25e-06, "error": null, "created_at": "2026-05-13T05:04:03Z"}
{"id": 1078, "parent_run_id": "7961d8c5b60e562c", "task_class": "detect_language", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 834, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-13T05:04:04Z"}
{"id": 1079, "parent_run_id": "7961d8c5b60e562c", "task_class": "detect_language", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 604, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-13T05:04:05Z"}
{"id": 1080, "parent_run_id": "7961d8c5b60e562c", "task_class": "detect_language", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]", "output_text": "de", "expected": "de", "correct": 1, "latency_ms": 365, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-13T05:04:05Z"}
{"id": 1081, "parent_run_id": "3e82a6be19faec60", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 699, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:06Z"}
{"id": 1082, "parent_run_id": "3e82a6be19faec60", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 703, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:04:06Z"}
{"id": 1083, "parent_run_id": "3e82a6be19faec60", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 641, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:04:07Z"}
{"id": 1084, "parent_run_id": "f434bb6444421cd7", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 593, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:08Z"}
{"id": 1085, "parent_run_id": "f434bb6444421cd7", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 1081, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:04:09Z"}
{"id": 1086, "parent_run_id": "f434bb6444421cd7", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 467, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:04:09Z"}
{"id": 1087, "parent_run_id": "3e5a159a15cb9481", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 595, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-13T05:04:10Z"}
{"id": 1088, "parent_run_id": "3e5a159a15cb9481", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 2330, "input_tokens": 9, "output_tokens": 1, "cost_eur": 9.749999999999998e-07, "error": null, "created_at": "2026-05-13T05:04:12Z"}
{"id": 1089, "parent_run_id": "3e5a159a15cb9481", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Neutral", "expected": "neutral", "correct": 1, "latency_ms": 3390, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-13T05:04:16Z"}
{"id": 1090, "parent_run_id": "0dcaf16cc43ff8fc", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "positive", "expected": "positive", "correct": 1, "latency_ms": 658, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:16Z"}
{"id": 1091, "parent_run_id": "0dcaf16cc43ff8fc", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 1278, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:04:17Z"}
{"id": 1092, "parent_run_id": "0dcaf16cc43ff8fc", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]", "output_text": "Positive", "expected": "positive", "correct": 1, "latency_ms": 704, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:04:18Z"}
{"id": 1093, "parent_run_id": "9628d7920f88d377", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 761, "input_tokens": 12, "output_tokens": 2, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:19Z"}
{"id": 1094, "parent_run_id": "9628d7920f88d377", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "negative", "expected": "negative", "correct": 1, "latency_ms": 1298, "input_tokens": 12, "output_tokens": 2, "cost_eur": 1.5e-06, "error": null, "created_at": "2026-05-13T05:04:20Z"}
{"id": 1095, "parent_run_id": "9628d7920f88d377", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]", "output_text": "Negative", "expected": "negative", "correct": 1, "latency_ms": 523, "input_tokens": 12, "output_tokens": 2, "cost_eur": 3e-06, "error": null, "created_at": "2026-05-13T05:04:21Z"}
{"id": 1096, "parent_run_id": "7b94478bff0bbeaa", "task_class": "classify_sentiment", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 668, "input_tokens": 9, "output_tokens": 1, "cost_eur": 3.5e-06, "error": null, "created_at": "2026-05-13T05:04:21Z"}
{"id": 1097, "parent_run_id": "7b94478bff0bbeaa", "task_class": "classify_sentiment", "subtask_idx": 1, "provider": "gemini", "model_name": "gemini", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "Positive", "expected": "neutral", "correct": 0, "latency_ms": 3125, "input_tokens": 9, "output_tokens": 2, "cost_eur": 1.2749999999999999e-06, "error": null, "created_at": "2026-05-13T05:04:25Z"}
{"id": 1098, "parent_run_id": "7b94478bff0bbeaa", "task_class": "classify_sentiment", "subtask_idx": 2, "provider": "openai", "model_name": "openai", "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]", "output_text": "neutral", "expected": "neutral", "correct": 1, "latency_ms": 2682, "input_tokens": 9, "output_tokens": 1, "cost_eur": 1.9499999999999995e-06, "error": null, "created_at": "2026-05-13T05:04:27Z"}
{"id": 1099, "parent_run_id": "53b02ef085cccc69", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 739, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-13T05:04:28Z"}
{"id": 1100, "parent_run_id": "e613827564a117b4", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 812, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-13T05:04:29Z"}
{"id": 1101, "parent_run_id": "cdc2683114e00aeb", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 603, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:29Z"}
{"id": 1102, "parent_run_id": "30f56f4a848f636c", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]", "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]", "correct": 1, "latency_ms": 722, "input_tokens": 15, "output_tokens": 13, "cost_eur": 2e-05, "error": null, "created_at": "2026-05-13T05:04:30Z"}
{"id": 1103, "parent_run_id": "eed132185f667bd6", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]", "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[\"hello@astranl.com\"]", "correct": 1, "latency_ms": 849, "input_tokens": 9, "output_tokens": 8, "cost_eur": 1.225e-05, "error": null, "created_at": "2026-05-13T05:04:31Z"}
{"id": 1104, "parent_run_id": "b6306081392154e3", "task_class": "extract_emails", "subtask_idx": 0, "provider": "anthropic", "model_name": "anthropic", "input_text": "No emails in this text at all.... [sha256:126563e18796]", "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]", "expected": "[]", "correct": 1, "latency_ms": 1031, "input_tokens": 7, "output_tokens": 3, "cost_eur": 5.5e-06, "error": null, "created_at": "2026-05-13T05:04:32Z"}
