[
  {
    "id": 1,
    "parent_run_id": "569784d8605018c3",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 838,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T19:58:48Z"
  },
  {
    "id": 2,
    "parent_run_id": "569784d8605018c3",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 614,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T19:58:49Z"
  },
  {
    "id": 3,
    "parent_run_id": "569784d8605018c3",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you today friend... [sha256:4d080c4227e4]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1899,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T19:58:51Z"
  },
  {
    "id": 4,
    "parent_run_id": "2302a774d4a3315e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1344,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T19:59:04Z"
  },
  {
    "id": 5,
    "parent_run_id": "2302a774d4a3315e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1435,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T19:59:06Z"
  },
  {
    "id": 6,
    "parent_run_id": "2302a774d4a3315e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I really love this restaurant the food was amazing... [sha256:6e7bb65413ec]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 3345,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T19:59:09Z"
  },
  {
    "id": 8,
    "parent_run_id": "e94044497284edf1",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1099,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:17Z"
  },
  {
    "id": 9,
    "parent_run_id": "e94044497284edf1",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 655,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:18Z"
  },
  {
    "id": 10,
    "parent_run_id": "e94044497284edf1",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 724,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:19Z"
  },
  {
    "id": 11,
    "parent_run_id": "05c6aa064dd2e7a0",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 574,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:19Z"
  },
  {
    "id": 12,
    "parent_run_id": "05c6aa064dd2e7a0",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 932,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:20Z"
  },
  {
    "id": 13,
    "parent_run_id": "05c6aa064dd2e7a0",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 921,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:21Z"
  },
  {
    "id": 14,
    "parent_run_id": "32e48ed3f24ea2c1",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 689,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:22Z"
  },
  {
    "id": 15,
    "parent_run_id": "32e48ed3f24ea2c1",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 730,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:22Z"
  },
  {
    "id": 16,
    "parent_run_id": "32e48ed3f24ea2c1",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 767,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:23Z"
  },
  {
    "id": 17,
    "parent_run_id": "5d2ea7de89422385",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 1179,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:24Z"
  },
  {
    "id": 18,
    "parent_run_id": "5d2ea7de89422385",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 643,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 8.249999999999999e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:25Z"
  },
  {
    "id": 19,
    "parent_run_id": "5d2ea7de89422385",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 652,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 1.6499999999999999e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:26Z"
  },
  {
    "id": 20,
    "parent_run_id": "e537c69770f0b8ea",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 530,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:26Z"
  },
  {
    "id": 21,
    "parent_run_id": "e537c69770f0b8ea",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 729,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:27Z"
  },
  {
    "id": 22,
    "parent_run_id": "e537c69770f0b8ea",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 1575,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:29Z"
  },
  {
    "id": 23,
    "parent_run_id": "50a22d316f18cf47",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 684,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:29Z"
  },
  {
    "id": 24,
    "parent_run_id": "50a22d316f18cf47",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 712,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:30Z"
  },
  {
    "id": 25,
    "parent_run_id": "50a22d316f18cf47",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 1669,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:32Z"
  },
  {
    "id": 26,
    "parent_run_id": "94a0b7c186760859",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 782,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 1.75e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:32Z"
  },
  {
    "id": 27,
    "parent_run_id": "94a0b7c186760859",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 922,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 4.5e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:33Z"
  },
  {
    "id": 28,
    "parent_run_id": "94a0b7c186760859",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 498,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 9e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:34Z"
  },
  {
    "id": 29,
    "parent_run_id": "0c70d782b2f58231",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 1134,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 2e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:35Z"
  },
  {
    "id": 30,
    "parent_run_id": "0c70d782b2f58231",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 711,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 5.25e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:36Z"
  },
  {
    "id": 31,
    "parent_run_id": "0c70d782b2f58231",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 630,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 1.05e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:36Z"
  },
  {
    "id": 32,
    "parent_run_id": "fffea5f0c027c8f5",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 668,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:37Z"
  },
  {
    "id": 33,
    "parent_run_id": "fffea5f0c027c8f5",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 739,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:38Z"
  },
  {
    "id": 34,
    "parent_run_id": "fffea5f0c027c8f5",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 582,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:38Z"
  },
  {
    "id": 35,
    "parent_run_id": "07ef8841e44ea536",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 673,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:39Z"
  },
  {
    "id": 36,
    "parent_run_id": "07ef8841e44ea536",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 741,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:40Z"
  },
  {
    "id": 37,
    "parent_run_id": "07ef8841e44ea536",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1284,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:41Z"
  },
  {
    "id": 38,
    "parent_run_id": "9a106432baeaf861",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 744,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:42Z"
  },
  {
    "id": 39,
    "parent_run_id": "9a106432baeaf861",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2687,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:45Z"
  },
  {
    "id": 40,
    "parent_run_id": "9a106432baeaf861",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1098,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:46Z"
  },
  {
    "id": 41,
    "parent_run_id": "0edef7c530affbb4",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 545,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:46Z"
  },
  {
    "id": 42,
    "parent_run_id": "0edef7c530affbb4",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1505,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:48Z"
  },
  {
    "id": 43,
    "parent_run_id": "0edef7c530affbb4",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 565,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:48Z"
  },
  {
    "id": 44,
    "parent_run_id": "01f4d3c1c7da7883",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 768,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:49Z"
  },
  {
    "id": 45,
    "parent_run_id": "01f4d3c1c7da7883",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1565,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:51Z"
  },
  {
    "id": 46,
    "parent_run_id": "01f4d3c1c7da7883",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 788,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:51Z"
  },
  {
    "id": 47,
    "parent_run_id": "d8a49ab8c7b6e594",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:52Z"
  },
  {
    "id": 48,
    "parent_run_id": "d8a49ab8c7b6e594",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2031,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:00:54Z"
  },
  {
    "id": 49,
    "parent_run_id": "d8a49ab8c7b6e594",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 543,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:55Z"
  },
  {
    "id": 50,
    "parent_run_id": "3a00bfa5d27f1c9f",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 701,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 5.25e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:55Z"
  },
  {
    "id": 51,
    "parent_run_id": "3a00bfa5d27f1c9f",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1543,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 1.425e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:57Z"
  },
  {
    "id": 52,
    "parent_run_id": "3a00bfa5d27f1c9f",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 543,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 2.85e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:58Z"
  },
  {
    "id": 53,
    "parent_run_id": "0ca4f51008950c0e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 784,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:00:58Z"
  },
  {
    "id": 54,
    "parent_run_id": "0ca4f51008950c0e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1217,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:01:00Z"
  },
  {
    "id": 55,
    "parent_run_id": "0ca4f51008950c0e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 5079,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:01:05Z"
  },
  {
    "id": 56,
    "parent_run_id": "ec1344e0b4909373",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1257,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:13Z"
  },
  {
    "id": 57,
    "parent_run_id": "ec1344e0b4909373",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 707,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:13Z"
  },
  {
    "id": 58,
    "parent_run_id": "ec1344e0b4909373",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 689,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:14Z"
  },
  {
    "id": 59,
    "parent_run_id": "664b86f26994faa2",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 735,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:15Z"
  },
  {
    "id": 60,
    "parent_run_id": "664b86f26994faa2",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1256,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:16Z"
  },
  {
    "id": 61,
    "parent_run_id": "664b86f26994faa2",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 838,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:17Z"
  },
  {
    "id": 62,
    "parent_run_id": "93ff4fced80ca0fa",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 701,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:18Z"
  },
  {
    "id": 63,
    "parent_run_id": "93ff4fced80ca0fa",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1214,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:19Z"
  },
  {
    "id": 64,
    "parent_run_id": "93ff4fced80ca0fa",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 535,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:19Z"
  },
  {
    "id": 65,
    "parent_run_id": "ce6e905815e92e8c",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 647,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:20Z"
  },
  {
    "id": 66,
    "parent_run_id": "ce6e905815e92e8c",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 1384,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 8.249999999999999e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:21Z"
  },
  {
    "id": 67,
    "parent_run_id": "ce6e905815e92e8c",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hola como estas hoy amigo mio... [sha256:bf779100908f]",
    "output_text": "es",
    "expected": "es",
    "correct": 1,
    "latency_ms": 655,
    "input_tokens": 7,
    "output_tokens": 1,
    "cost_eur": 1.6499999999999999e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:22Z"
  },
  {
    "id": 68,
    "parent_run_id": "c3a22b3921b646df",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:23Z"
  },
  {
    "id": 69,
    "parent_run_id": "c3a22b3921b646df",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 2440,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:25Z"
  },
  {
    "id": 70,
    "parent_run_id": "c3a22b3921b646df",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Привіт як справи сьогодні дорогий друже... [sha256:600c8ff1780c]",
    "output_text": "uk",
    "expected": "uk",
    "correct": 1,
    "latency_ms": 771,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:26Z"
  },
  {
    "id": 71,
    "parent_run_id": "13e301ea8d02670b",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 778,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:27Z"
  },
  {
    "id": 72,
    "parent_run_id": "13e301ea8d02670b",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 1633,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:28Z"
  },
  {
    "id": 73,
    "parent_run_id": "13e301ea8d02670b",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hoe gaat het met u vandaag mijn vriend... [sha256:3ecfbd873836]",
    "output_text": "nl",
    "expected": "nl",
    "correct": 1,
    "latency_ms": 553,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:29Z"
  },
  {
    "id": 74,
    "parent_run_id": "7b52928ba96c33e5",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 839,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 1.75e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:30Z"
  },
  {
    "id": 75,
    "parent_run_id": "7b52928ba96c33e5",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 1025,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 4.5e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:31Z"
  },
  {
    "id": 76,
    "parent_run_id": "7b52928ba96c33e5",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "你好今天过得怎么样朋友... [sha256:3d13851981d1]",
    "output_text": "zh",
    "expected": "zh",
    "correct": 1,
    "latency_ms": 950,
    "input_tokens": 2,
    "output_tokens": 1,
    "cost_eur": 9e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:32Z"
  },
  {
    "id": 77,
    "parent_run_id": "432df99b281bf0d2",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 657,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 2e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:32Z"
  },
  {
    "id": 78,
    "parent_run_id": "432df99b281bf0d2",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 1300,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 5.25e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:34Z"
  },
  {
    "id": 79,
    "parent_run_id": "432df99b281bf0d2",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "こんにちは今日はどうですか友達... [sha256:46529f264bf3]",
    "output_text": "ja",
    "expected": "ja",
    "correct": 1,
    "latency_ms": 911,
    "input_tokens": 3,
    "output_tokens": 1,
    "cost_eur": 1.05e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:35Z"
  },
  {
    "id": 80,
    "parent_run_id": "4ef59567b86b0c49",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:35Z"
  },
  {
    "id": 81,
    "parent_run_id": "4ef59567b86b0c49",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 738,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:36Z"
  },
  {
    "id": 82,
    "parent_run_id": "4ef59567b86b0c49",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 734,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:37Z"
  },
  {
    "id": 83,
    "parent_run_id": "1f0ae896b944f838",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1197,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:38Z"
  },
  {
    "id": 84,
    "parent_run_id": "1f0ae896b944f838",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1123,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:39Z"
  },
  {
    "id": 85,
    "parent_run_id": "1f0ae896b944f838",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 638,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:40Z"
  },
  {
    "id": 86,
    "parent_run_id": "0923bd99ff5aab18",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 695,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:40Z"
  },
  {
    "id": 87,
    "parent_run_id": "0923bd99ff5aab18",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1644,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:42Z"
  },
  {
    "id": 88,
    "parent_run_id": "0923bd99ff5aab18",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 509,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:43Z"
  },
  {
    "id": 89,
    "parent_run_id": "c6d76954f935f0c3",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1068,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:44Z"
  },
  {
    "id": 90,
    "parent_run_id": "c6d76954f935f0c3",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1212,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:45Z"
  },
  {
    "id": 91,
    "parent_run_id": "c6d76954f935f0c3",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Best purchase I've made all year highly recommend... [sha256:0195cabc4f26]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1248,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:46Z"
  },
  {
    "id": 92,
    "parent_run_id": "7e9ddefae86b675b",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 688,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:47Z"
  },
  {
    "id": 93,
    "parent_run_id": "7e9ddefae86b675b",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 918,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:48Z"
  },
  {
    "id": 94,
    "parent_run_id": "7e9ddefae86b675b",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Worst customer service ever do not buy from them... [sha256:b28f1fc6fa48]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 588,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:48Z"
  },
  {
    "id": 95,
    "parent_run_id": "b41e9185c0867d9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 809,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:49Z"
  },
  {
    "id": 96,
    "parent_run_id": "b41e9185c0867d9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1462,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-29T20:08:51Z"
  },
  {
    "id": 97,
    "parent_run_id": "b41e9185c0867d9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "It's an okay product nothing special... [sha256:b3ae3150c611]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 472,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:51Z"
  },
  {
    "id": 98,
    "parent_run_id": "25a0d93cb5e72fd8",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 481,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 5.25e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:52Z"
  },
  {
    "id": 99,
    "parent_run_id": "25a0d93cb5e72fd8",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 925,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 1.425e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:53Z"
  },
  {
    "id": 100,
    "parent_run_id": "25a0d93cb5e72fd8",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Amazing quality and fast shipping very happy... [sha256:c1aec6b2c7ab]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 909,
    "input_tokens": 11,
    "output_tokens": 2,
    "cost_eur": 2.85e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:53Z"
  },
  {
    "id": 101,
    "parent_run_id": "37f42aaa449acc66",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1117,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:55Z"
  },
  {
    "id": 102,
    "parent_run_id": "37f42aaa449acc66",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 830,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:55Z"
  },
  {
    "id": 103,
    "parent_run_id": "37f42aaa449acc66",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Disappointed with the build quality breaks easily... [sha256:6ff0625c7dd9]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 627,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:56Z"
  },
  {
    "id": 104,
    "parent_run_id": "a5a9b705bad1ddf1",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 804,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-29T20:08:57Z"
  },
  {
    "id": 105,
    "parent_run_id": "9674a9901a3acb26",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 620,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-29T20:08:58Z"
  },
  {
    "id": 106,
    "parent_run_id": "0d5c9963edc33d5e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 688,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:08:58Z"
  },
  {
    "id": 109,
    "parent_run_id": "58f716fafc753cee",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1133,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-29T20:09:32Z"
  },
  {
    "id": 110,
    "parent_run_id": "2f7f7337874c60d6",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 780,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-29T20:09:32Z"
  },
  {
    "id": 111,
    "parent_run_id": "b1f2379c878183d0",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 920,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-29T20:09:33Z"
  },
  {
    "id": 163,
    "parent_run_id": "c09e5aaa82d3a5c2",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1238,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:18Z"
  },
  {
    "id": 164,
    "parent_run_id": "c09e5aaa82d3a5c2",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1785,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:20Z"
  },
  {
    "id": 165,
    "parent_run_id": "c09e5aaa82d3a5c2",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1889,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:21Z"
  },
  {
    "id": 166,
    "parent_run_id": "5cd01907ecb5ab71",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 682,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:22Z"
  },
  {
    "id": 167,
    "parent_run_id": "5cd01907ecb5ab71",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1318,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:23Z"
  },
  {
    "id": 168,
    "parent_run_id": "5cd01907ecb5ab71",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 726,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:24Z"
  },
  {
    "id": 169,
    "parent_run_id": "5f801996834333cd",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 551,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:25Z"
  },
  {
    "id": 170,
    "parent_run_id": "5f801996834333cd",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2284,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T03:57:27Z"
  },
  {
    "id": 171,
    "parent_run_id": "5f801996834333cd",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 833,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:28Z"
  },
  {
    "id": 172,
    "parent_run_id": "f8071966fc082d1d",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 654,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:29Z"
  },
  {
    "id": 173,
    "parent_run_id": "f8071966fc082d1d",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 621,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:29Z"
  },
  {
    "id": 174,
    "parent_run_id": "f8071966fc082d1d",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 701,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:30Z"
  },
  {
    "id": 175,
    "parent_run_id": "7b592c04cec63660",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 671,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:31Z"
  },
  {
    "id": 176,
    "parent_run_id": "7b592c04cec63660",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 620,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:31Z"
  },
  {
    "id": 177,
    "parent_run_id": "7b592c04cec63660",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 490,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:32Z"
  },
  {
    "id": 178,
    "parent_run_id": "49df5566ec200f98",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 628,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:32Z"
  },
  {
    "id": 179,
    "parent_run_id": "49df5566ec200f98",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 575,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T03:57:33Z"
  },
  {
    "id": 180,
    "parent_run_id": "49df5566ec200f98",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 2250,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:35Z"
  },
  {
    "id": 181,
    "parent_run_id": "5c99f533b4ddc7c5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 706,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-30T03:57:36Z"
  },
  {
    "id": 182,
    "parent_run_id": "da12cecb8bddffa2",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 673,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T03:57:37Z"
  },
  {
    "id": 183,
    "parent_run_id": "5d2591057eab2f18",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 698,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:37Z"
  },
  {
    "id": 184,
    "parent_run_id": "163d3748659dfe17",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 459,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:38Z"
  },
  {
    "id": 185,
    "parent_run_id": "163d3748659dfe17",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 513,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:38Z"
  },
  {
    "id": 186,
    "parent_run_id": "163d3748659dfe17",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1470,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:40Z"
  },
  {
    "id": 187,
    "parent_run_id": "afd16d4d9c56a3ac",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 603,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:40Z"
  },
  {
    "id": 188,
    "parent_run_id": "afd16d4d9c56a3ac",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 659,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:41Z"
  },
  {
    "id": 189,
    "parent_run_id": "afd16d4d9c56a3ac",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 419,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:41Z"
  },
  {
    "id": 190,
    "parent_run_id": "56c37aa4132a570a",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 769,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:42Z"
  },
  {
    "id": 191,
    "parent_run_id": "56c37aa4132a570a",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 978,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T03:57:43Z"
  },
  {
    "id": 192,
    "parent_run_id": "56c37aa4132a570a",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1406,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:45Z"
  },
  {
    "id": 193,
    "parent_run_id": "9ff49a2c51560b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 596,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:45Z"
  },
  {
    "id": 194,
    "parent_run_id": "9ff49a2c51560b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1366,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:47Z"
  },
  {
    "id": 195,
    "parent_run_id": "9ff49a2c51560b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 824,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:47Z"
  },
  {
    "id": 196,
    "parent_run_id": "dbd9714b10d44175",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 645,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:48Z"
  },
  {
    "id": 197,
    "parent_run_id": "dbd9714b10d44175",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 768,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:49Z"
  },
  {
    "id": 198,
    "parent_run_id": "dbd9714b10d44175",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 546,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:49Z"
  },
  {
    "id": 199,
    "parent_run_id": "0b4c8ac78f753d28",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 437,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:50Z"
  },
  {
    "id": 200,
    "parent_run_id": "0b4c8ac78f753d28",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2030,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T03:57:52Z"
  },
  {
    "id": 201,
    "parent_run_id": "0b4c8ac78f753d28",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 953,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:53Z"
  },
  {
    "id": 202,
    "parent_run_id": "7c1d84e0de0c892d",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 730,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:54Z"
  },
  {
    "id": 203,
    "parent_run_id": "7c1d84e0de0c892d",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1079,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:55Z"
  },
  {
    "id": 204,
    "parent_run_id": "7c1d84e0de0c892d",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 882,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:55Z"
  },
  {
    "id": 205,
    "parent_run_id": "5325c330ebb6d081",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 663,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:56Z"
  },
  {
    "id": 206,
    "parent_run_id": "5325c330ebb6d081",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 830,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:57Z"
  },
  {
    "id": 207,
    "parent_run_id": "5325c330ebb6d081",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 786,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:58Z"
  },
  {
    "id": 208,
    "parent_run_id": "d1ae73c0de4af741",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 467,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:57:58Z"
  },
  {
    "id": 209,
    "parent_run_id": "d1ae73c0de4af741",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1848,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T03:58:00Z"
  },
  {
    "id": 210,
    "parent_run_id": "d1ae73c0de4af741",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 570,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T03:58:01Z"
  },
  {
    "id": 211,
    "parent_run_id": "ee3688380110e8f5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 712,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-30T03:58:01Z"
  },
  {
    "id": 212,
    "parent_run_id": "ba4150af1e444210",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 696,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T03:58:02Z"
  },
  {
    "id": 213,
    "parent_run_id": "0ead5a10d507a438",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 666,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:58:03Z"
  },
  {
    "id": 214,
    "parent_run_id": "77eedc90a745b043",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\n  \"alice@example.com\",\n  \"bob.smith@test.org\"\n]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 876,
    "input_tokens": 15,
    "output_tokens": 15,
    "cost_eur": 2.25e-05,
    "error": null,
    "created_at": "2026-04-30T03:58:04Z"
  },
  {
    "id": 215,
    "parent_run_id": "341b5fb21f215e13",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 590,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T03:58:04Z"
  },
  {
    "id": 216,
    "parent_run_id": "5fdd56cf16bf18ed",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 651,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T03:58:05Z"
  },
  {
    "id": 217,
    "parent_run_id": "b3e6999434c12f90",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1803,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:00Z"
  },
  {
    "id": 218,
    "parent_run_id": "b3e6999434c12f90",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 715,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:00Z"
  },
  {
    "id": 219,
    "parent_run_id": "b3e6999434c12f90",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 719,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:01Z"
  },
  {
    "id": 220,
    "parent_run_id": "69693f3b4b4eb469",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 778,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:02Z"
  },
  {
    "id": 221,
    "parent_run_id": "69693f3b4b4eb469",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1520,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:03Z"
  },
  {
    "id": 222,
    "parent_run_id": "69693f3b4b4eb469",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 723,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:04Z"
  },
  {
    "id": 223,
    "parent_run_id": "bf8e6fc6923a78e4",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 935,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:05Z"
  },
  {
    "id": 224,
    "parent_run_id": "bf8e6fc6923a78e4",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2364,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T05:01:08Z"
  },
  {
    "id": 225,
    "parent_run_id": "bf8e6fc6923a78e4",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 996,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:09Z"
  },
  {
    "id": 226,
    "parent_run_id": "da9e2d4be31deafc",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 662,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:09Z"
  },
  {
    "id": 227,
    "parent_run_id": "da9e2d4be31deafc",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 758,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:10Z"
  },
  {
    "id": 228,
    "parent_run_id": "da9e2d4be31deafc",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 748,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:11Z"
  },
  {
    "id": 229,
    "parent_run_id": "dc099b48b31646bb",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 641,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:11Z"
  },
  {
    "id": 230,
    "parent_run_id": "dc099b48b31646bb",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 837,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:12Z"
  },
  {
    "id": 231,
    "parent_run_id": "dc099b48b31646bb",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 788,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:13Z"
  },
  {
    "id": 232,
    "parent_run_id": "acc5b8b8426fc539",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 900,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:14Z"
  },
  {
    "id": 233,
    "parent_run_id": "acc5b8b8426fc539",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 951,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T05:01:15Z"
  },
  {
    "id": 234,
    "parent_run_id": "acc5b8b8426fc539",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 631,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:15Z"
  },
  {
    "id": 235,
    "parent_run_id": "e4c6a274897db81a",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 753,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:16Z"
  },
  {
    "id": 236,
    "parent_run_id": "8eaa5b511ba7ceb3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 868,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:17Z"
  },
  {
    "id": 237,
    "parent_run_id": "260bced4c91a3626",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 920,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:18Z"
  },
  {
    "id": 238,
    "parent_run_id": "cdb006de647d8323",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 973,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:19Z"
  },
  {
    "id": 239,
    "parent_run_id": "cdb006de647d8323",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 825,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:20Z"
  },
  {
    "id": 240,
    "parent_run_id": "cdb006de647d8323",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 702,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:21Z"
  },
  {
    "id": 241,
    "parent_run_id": "382fec2a79835556",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 2711,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:23Z"
  },
  {
    "id": 242,
    "parent_run_id": "382fec2a79835556",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 917,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:24Z"
  },
  {
    "id": 243,
    "parent_run_id": "382fec2a79835556",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 442,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:25Z"
  },
  {
    "id": 244,
    "parent_run_id": "8696116792cbd76a",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 691,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:25Z"
  },
  {
    "id": 245,
    "parent_run_id": "8696116792cbd76a",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 617,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T05:01:26Z"
  },
  {
    "id": 246,
    "parent_run_id": "8696116792cbd76a",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 710,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:27Z"
  },
  {
    "id": 247,
    "parent_run_id": "22ec532678ff8f22",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 622,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:27Z"
  },
  {
    "id": 248,
    "parent_run_id": "22ec532678ff8f22",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1087,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:28Z"
  },
  {
    "id": 249,
    "parent_run_id": "22ec532678ff8f22",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 410,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:29Z"
  },
  {
    "id": 250,
    "parent_run_id": "1bbd931ee93144a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 662,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:29Z"
  },
  {
    "id": 251,
    "parent_run_id": "1bbd931ee93144a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1098,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:31Z"
  },
  {
    "id": 252,
    "parent_run_id": "1bbd931ee93144a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 629,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:31Z"
  },
  {
    "id": 253,
    "parent_run_id": "97adcbc6fabf19a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 634,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:32Z"
  },
  {
    "id": 254,
    "parent_run_id": "97adcbc6fabf19a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 4161,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:36Z"
  },
  {
    "id": 255,
    "parent_run_id": "97adcbc6fabf19a9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2210,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:38Z"
  },
  {
    "id": 256,
    "parent_run_id": "12f0822948c8c417",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 608,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:39Z"
  },
  {
    "id": 257,
    "parent_run_id": "12f0822948c8c417",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1203,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:40Z"
  },
  {
    "id": 258,
    "parent_run_id": "12f0822948c8c417",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 385,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:40Z"
  },
  {
    "id": 259,
    "parent_run_id": "a145be8a15eeedfa",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 2690,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:43Z"
  },
  {
    "id": 260,
    "parent_run_id": "a145be8a15eeedfa",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1539,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:45Z"
  },
  {
    "id": 261,
    "parent_run_id": "a145be8a15eeedfa",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 534,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:45Z"
  },
  {
    "id": 262,
    "parent_run_id": "5310a92252d0f897",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 707,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:46Z"
  },
  {
    "id": 263,
    "parent_run_id": "5310a92252d0f897",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2646,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-04-30T05:01:49Z"
  },
  {
    "id": 264,
    "parent_run_id": "5310a92252d0f897",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 514,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:49Z"
  },
  {
    "id": 265,
    "parent_run_id": "1d5458b42eac071b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 767,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:50Z"
  },
  {
    "id": 266,
    "parent_run_id": "bb34ce671346fd28",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 757,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:51Z"
  },
  {
    "id": 267,
    "parent_run_id": "b3f98870bf2a6386",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 765,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:51Z"
  },
  {
    "id": 268,
    "parent_run_id": "686efe1daaf6b507",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 851,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:52Z"
  },
  {
    "id": 269,
    "parent_run_id": "e2bda82e8acaa770",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 742,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-04-30T05:01:53Z"
  },
  {
    "id": 270,
    "parent_run_id": "eced7ec5717eeed3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 663,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-04-30T05:01:54Z"
  },
  {
    "id": 271,
    "parent_run_id": "f5e08181dd53d420",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1390,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:20Z"
  },
  {
    "id": 272,
    "parent_run_id": "f5e08181dd53d420",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 745,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:21Z"
  },
  {
    "id": 273,
    "parent_run_id": "f5e08181dd53d420",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1562,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:22Z"
  },
  {
    "id": 274,
    "parent_run_id": "0b8d3a5acce62411",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 710,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:23Z"
  },
  {
    "id": 275,
    "parent_run_id": "0b8d3a5acce62411",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1272,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:24Z"
  },
  {
    "id": 276,
    "parent_run_id": "0b8d3a5acce62411",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 557,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:25Z"
  },
  {
    "id": 277,
    "parent_run_id": "d98866809761018e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 727,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:25Z"
  },
  {
    "id": 278,
    "parent_run_id": "d98866809761018e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2000,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-01T05:00:27Z"
  },
  {
    "id": 279,
    "parent_run_id": "d98866809761018e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 886,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:28Z"
  },
  {
    "id": 280,
    "parent_run_id": "4a2105df029d21c8",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 699,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:29Z"
  },
  {
    "id": 281,
    "parent_run_id": "4a2105df029d21c8",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 673,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:30Z"
  },
  {
    "id": 282,
    "parent_run_id": "4a2105df029d21c8",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 808,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:31Z"
  },
  {
    "id": 283,
    "parent_run_id": "89bd10524f4ad348",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 683,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:31Z"
  },
  {
    "id": 284,
    "parent_run_id": "89bd10524f4ad348",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 695,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:32Z"
  },
  {
    "id": 285,
    "parent_run_id": "89bd10524f4ad348",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 454,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:32Z"
  },
  {
    "id": 286,
    "parent_run_id": "7724143b111c3db7",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 860,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:33Z"
  },
  {
    "id": 287,
    "parent_run_id": "7724143b111c3db7",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 904,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-01T05:00:34Z"
  },
  {
    "id": 288,
    "parent_run_id": "7724143b111c3db7",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1373,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:36Z"
  },
  {
    "id": 289,
    "parent_run_id": "79e8130e8c0f816e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 796,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-01T05:00:36Z"
  },
  {
    "id": 290,
    "parent_run_id": "c65adee1e55ddcfa",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 733,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-01T05:00:37Z"
  },
  {
    "id": 291,
    "parent_run_id": "8be8d6cae651a103",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1020,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:38Z"
  },
  {
    "id": 292,
    "parent_run_id": "6ccccbfc79c76e35",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 532,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:39Z"
  },
  {
    "id": 293,
    "parent_run_id": "6ccccbfc79c76e35",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 827,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:39Z"
  },
  {
    "id": 294,
    "parent_run_id": "6ccccbfc79c76e35",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 765,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:40Z"
  },
  {
    "id": 295,
    "parent_run_id": "0c47ced9d8d50e3f",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 749,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:41Z"
  },
  {
    "id": 296,
    "parent_run_id": "0c47ced9d8d50e3f",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 617,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:42Z"
  },
  {
    "id": 297,
    "parent_run_id": "0c47ced9d8d50e3f",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 844,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:42Z"
  },
  {
    "id": 298,
    "parent_run_id": "418cc3e07572bede",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 615,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:43Z"
  },
  {
    "id": 299,
    "parent_run_id": "418cc3e07572bede",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 941,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-01T05:00:44Z"
  },
  {
    "id": 300,
    "parent_run_id": "418cc3e07572bede",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 453,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:44Z"
  },
  {
    "id": 301,
    "parent_run_id": "335fbed6765f703d",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 909,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:45Z"
  },
  {
    "id": 302,
    "parent_run_id": "335fbed6765f703d",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 857,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:46Z"
  },
  {
    "id": 303,
    "parent_run_id": "335fbed6765f703d",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 601,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:47Z"
  },
  {
    "id": 304,
    "parent_run_id": "0e4707492261c26a",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 794,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:48Z"
  },
  {
    "id": 305,
    "parent_run_id": "0e4707492261c26a",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1341,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:49Z"
  },
  {
    "id": 306,
    "parent_run_id": "0e4707492261c26a",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 526,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:50Z"
  },
  {
    "id": 307,
    "parent_run_id": "1262a2b90563102e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 565,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:50Z"
  },
  {
    "id": 308,
    "parent_run_id": "1262a2b90563102e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2129,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-01T05:00:52Z"
  },
  {
    "id": 309,
    "parent_run_id": "1262a2b90563102e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 480,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:53Z"
  },
  {
    "id": 310,
    "parent_run_id": "e99ad07c936f352e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 710,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:53Z"
  },
  {
    "id": 311,
    "parent_run_id": "e99ad07c936f352e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1251,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:55Z"
  },
  {
    "id": 312,
    "parent_run_id": "e99ad07c936f352e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 412,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:55Z"
  },
  {
    "id": 313,
    "parent_run_id": "1d058112a46b915b",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:56Z"
  },
  {
    "id": 314,
    "parent_run_id": "1d058112a46b915b",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1014,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:57Z"
  },
  {
    "id": 315,
    "parent_run_id": "1d058112a46b915b",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 805,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-01T05:00:58Z"
  },
  {
    "id": 316,
    "parent_run_id": "46bb09449fa21a52",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2371,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:01:00Z"
  },
  {
    "id": 317,
    "parent_run_id": "46bb09449fa21a52",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2672,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-01T05:01:03Z"
  },
  {
    "id": 318,
    "parent_run_id": "46bb09449fa21a52",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 496,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-01T05:01:03Z"
  },
  {
    "id": 319,
    "parent_run_id": "95d57e27968cbf8d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 775,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-01T05:01:04Z"
  },
  {
    "id": 320,
    "parent_run_id": "f4419a2f862019ac",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 760,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-01T05:01:05Z"
  },
  {
    "id": 321,
    "parent_run_id": "a21d1fcd10cbc612",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 717,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:01:06Z"
  },
  {
    "id": 322,
    "parent_run_id": "ea3ee2a70ce54be0",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 764,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-01T05:01:06Z"
  },
  {
    "id": 323,
    "parent_run_id": "f63d1aedbc32f13e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 594,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-01T05:01:07Z"
  },
  {
    "id": 324,
    "parent_run_id": "fa26bb6eee780038",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 565,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-01T05:01:07Z"
  },
  {
    "id": 325,
    "parent_run_id": "a520bffc3fa0df51",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1480,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:50Z"
  },
  {
    "id": 326,
    "parent_run_id": "a520bffc3fa0df51",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 592,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:50Z"
  },
  {
    "id": 327,
    "parent_run_id": "a520bffc3fa0df51",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 870,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:51Z"
  },
  {
    "id": 328,
    "parent_run_id": "19be8f7f16f7698e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 918,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:52Z"
  },
  {
    "id": 329,
    "parent_run_id": "19be8f7f16f7698e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1184,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:53Z"
  },
  {
    "id": 330,
    "parent_run_id": "19be8f7f16f7698e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1209,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:54Z"
  },
  {
    "id": 331,
    "parent_run_id": "65f05a6600f33b96",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 457,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 4.75e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:55Z"
  },
  {
    "id": 332,
    "parent_run_id": "65f05a6600f33b96",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 2602,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:57Z"
  },
  {
    "id": 333,
    "parent_run_id": "65f05a6600f33b96",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 557,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-02T05:03:58Z"
  },
  {
    "id": 334,
    "parent_run_id": "31f79c1b9f551bf0",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 833,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-02T05:03:59Z"
  },
  {
    "id": 335,
    "parent_run_id": "c9f3d1c37d29e47a",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 684,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-02T05:04:00Z"
  },
  {
    "id": 336,
    "parent_run_id": "0642c14ff1d01266",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 810,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:00Z"
  },
  {
    "id": 337,
    "parent_run_id": "d1be3a01c6a4d7e2",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 476,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:01Z"
  },
  {
    "id": 338,
    "parent_run_id": "d1be3a01c6a4d7e2",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 588,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:01Z"
  },
  {
    "id": 339,
    "parent_run_id": "d1be3a01c6a4d7e2",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 819,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:02Z"
  },
  {
    "id": 340,
    "parent_run_id": "937e65fa2bf26773",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 526,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:03Z"
  },
  {
    "id": 341,
    "parent_run_id": "937e65fa2bf26773",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 952,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:04Z"
  },
  {
    "id": 342,
    "parent_run_id": "937e65fa2bf26773",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 430,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:04Z"
  },
  {
    "id": 343,
    "parent_run_id": "fd03af78aa73fca4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 708,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:05Z"
  },
  {
    "id": 344,
    "parent_run_id": "fd03af78aa73fca4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 695,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-02T05:04:06Z"
  },
  {
    "id": 345,
    "parent_run_id": "fd03af78aa73fca4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 708,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:06Z"
  },
  {
    "id": 346,
    "parent_run_id": "48bd8f99542a9ce2",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 713,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:07Z"
  },
  {
    "id": 347,
    "parent_run_id": "48bd8f99542a9ce2",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 686,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:08Z"
  },
  {
    "id": 348,
    "parent_run_id": "48bd8f99542a9ce2",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 842,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:09Z"
  },
  {
    "id": 349,
    "parent_run_id": "27335671ef9ac90e",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 714,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:09Z"
  },
  {
    "id": 350,
    "parent_run_id": "27335671ef9ac90e",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 2743,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:12Z"
  },
  {
    "id": 351,
    "parent_run_id": "27335671ef9ac90e",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 864,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:13Z"
  },
  {
    "id": 352,
    "parent_run_id": "5ef4043f6730fa37",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 456,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:13Z"
  },
  {
    "id": 353,
    "parent_run_id": "5ef4043f6730fa37",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 633,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-02T05:04:14Z"
  },
  {
    "id": 354,
    "parent_run_id": "5ef4043f6730fa37",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1624,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:16Z"
  },
  {
    "id": 355,
    "parent_run_id": "40572696c5d1a62e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 527,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:16Z"
  },
  {
    "id": 356,
    "parent_run_id": "40572696c5d1a62e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 603,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:17Z"
  },
  {
    "id": 357,
    "parent_run_id": "40572696c5d1a62e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 435,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:17Z"
  },
  {
    "id": 358,
    "parent_run_id": "8708d3e09408a2a4",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 950,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:18Z"
  },
  {
    "id": 359,
    "parent_run_id": "8708d3e09408a2a4",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 2165,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:20Z"
  },
  {
    "id": 360,
    "parent_run_id": "8708d3e09408a2a4",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 966,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:21Z"
  },
  {
    "id": 361,
    "parent_run_id": "1554805766880ea9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 967,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:22Z"
  },
  {
    "id": 362,
    "parent_run_id": "1554805766880ea9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2228,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-02T05:04:25Z"
  },
  {
    "id": 363,
    "parent_run_id": "1554805766880ea9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2202,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:27Z"
  },
  {
    "id": 364,
    "parent_run_id": "708e9140dc72751a",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1598,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:28Z"
  },
  {
    "id": 365,
    "parent_run_id": "708e9140dc72751a",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 973,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:29Z"
  },
  {
    "id": 366,
    "parent_run_id": "708e9140dc72751a",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 464,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:30Z"
  },
  {
    "id": 367,
    "parent_run_id": "a26fee4f295bd1cf",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 815,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:31Z"
  },
  {
    "id": 368,
    "parent_run_id": "a26fee4f295bd1cf",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1258,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:32Z"
  },
  {
    "id": 369,
    "parent_run_id": "a26fee4f295bd1cf",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 811,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:33Z"
  },
  {
    "id": 370,
    "parent_run_id": "3447094880117721",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 435,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:33Z"
  },
  {
    "id": 371,
    "parent_run_id": "3447094880117721",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2928,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-02T05:04:36Z"
  },
  {
    "id": 372,
    "parent_run_id": "3447094880117721",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 414,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:37Z"
  },
  {
    "id": 373,
    "parent_run_id": "385e47e66d7792de",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 909,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-02T05:04:37Z"
  },
  {
    "id": 374,
    "parent_run_id": "69b6b33263b58c7b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 722,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-02T05:04:38Z"
  },
  {
    "id": 375,
    "parent_run_id": "a53b6cb3ba8b1794",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 724,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:39Z"
  },
  {
    "id": 376,
    "parent_run_id": "77dd92ef321fe0e5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 736,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-02T05:04:40Z"
  },
  {
    "id": 377,
    "parent_run_id": "9698f371b6eda0aa",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 749,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-02T05:04:40Z"
  },
  {
    "id": 378,
    "parent_run_id": "2732284a37f76c99",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 606,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-02T05:04:41Z"
  },
  {
    "id": 379,
    "parent_run_id": "be7c06e0e38d7727",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1603,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:13Z"
  },
  {
    "id": 380,
    "parent_run_id": "be7c06e0e38d7727",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1197,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:14Z"
  },
  {
    "id": 381,
    "parent_run_id": "be7c06e0e38d7727",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2160,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:16Z"
  },
  {
    "id": 382,
    "parent_run_id": "35ea294e7b5cd325",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 698,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:17Z"
  },
  {
    "id": 383,
    "parent_run_id": "35ea294e7b5cd325",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 729,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:17Z"
  },
  {
    "id": 384,
    "parent_run_id": "35ea294e7b5cd325",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 902,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:18Z"
  },
  {
    "id": 385,
    "parent_run_id": "25e47c93feb6a59e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 612,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:19Z"
  },
  {
    "id": 386,
    "parent_run_id": "25e47c93feb6a59e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 3966,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-03T05:01:23Z"
  },
  {
    "id": 387,
    "parent_run_id": "25e47c93feb6a59e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1747,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:25Z"
  },
  {
    "id": 388,
    "parent_run_id": "a0b9445bf3327626",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 678,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-03T05:01:25Z"
  },
  {
    "id": 389,
    "parent_run_id": "3adf3c4909a63302",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 779,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-03T05:01:26Z"
  },
  {
    "id": 390,
    "parent_run_id": "cd753c6788d62ffc",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 623,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:27Z"
  },
  {
    "id": 391,
    "parent_run_id": "64a194fee9b083c7",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 623,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:27Z"
  },
  {
    "id": 392,
    "parent_run_id": "64a194fee9b083c7",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 881,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:28Z"
  },
  {
    "id": 393,
    "parent_run_id": "64a194fee9b083c7",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1614,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:30Z"
  },
  {
    "id": 394,
    "parent_run_id": "39331063492c10d6",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 458,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:30Z"
  },
  {
    "id": 395,
    "parent_run_id": "39331063492c10d6",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 642,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:31Z"
  },
  {
    "id": 396,
    "parent_run_id": "39331063492c10d6",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 474,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:31Z"
  },
  {
    "id": 397,
    "parent_run_id": "a9cfa975f6bf8333",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 457,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:32Z"
  },
  {
    "id": 398,
    "parent_run_id": "a9cfa975f6bf8333",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-03T05:01:33Z"
  },
  {
    "id": 399,
    "parent_run_id": "a9cfa975f6bf8333",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 716,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:33Z"
  },
  {
    "id": 400,
    "parent_run_id": "08648ea18ced865b",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 670,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:34Z"
  },
  {
    "id": 401,
    "parent_run_id": "08648ea18ced865b",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 549,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:35Z"
  },
  {
    "id": 402,
    "parent_run_id": "08648ea18ced865b",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1002,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:36Z"
  },
  {
    "id": 403,
    "parent_run_id": "0a967a3f3dcc802a",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 606,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:36Z"
  },
  {
    "id": 404,
    "parent_run_id": "0a967a3f3dcc802a",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 759,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:37Z"
  },
  {
    "id": 405,
    "parent_run_id": "0a967a3f3dcc802a",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 458,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:37Z"
  },
  {
    "id": 406,
    "parent_run_id": "e78af948bfe0e40d",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 636,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:38Z"
  },
  {
    "id": 407,
    "parent_run_id": "e78af948bfe0e40d",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 683,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-03T05:01:39Z"
  },
  {
    "id": 408,
    "parent_run_id": "e78af948bfe0e40d",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1052,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:40Z"
  },
  {
    "id": 409,
    "parent_run_id": "0ef3230faa8e67be",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 534,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:40Z"
  },
  {
    "id": 410,
    "parent_run_id": "0ef3230faa8e67be",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1126,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:42Z"
  },
  {
    "id": 411,
    "parent_run_id": "0ef3230faa8e67be",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 759,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:42Z"
  },
  {
    "id": 412,
    "parent_run_id": "10176a254af09444",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 675,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:43Z"
  },
  {
    "id": 413,
    "parent_run_id": "10176a254af09444",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1189,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:44Z"
  },
  {
    "id": 414,
    "parent_run_id": "10176a254af09444",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 637,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:45Z"
  },
  {
    "id": 415,
    "parent_run_id": "8c61d1db2abcecbc",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 671,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:46Z"
  },
  {
    "id": 416,
    "parent_run_id": "8c61d1db2abcecbc",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2300,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-03T05:01:48Z"
  },
  {
    "id": 417,
    "parent_run_id": "8c61d1db2abcecbc",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 528,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:48Z"
  },
  {
    "id": 418,
    "parent_run_id": "91c6066346700947",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 631,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:49Z"
  },
  {
    "id": 419,
    "parent_run_id": "91c6066346700947",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 993,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:50Z"
  },
  {
    "id": 420,
    "parent_run_id": "91c6066346700947",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 709,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:51Z"
  },
  {
    "id": 421,
    "parent_run_id": "ecfd379c6d20a8f7",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 609,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:51Z"
  },
  {
    "id": 422,
    "parent_run_id": "ecfd379c6d20a8f7",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1309,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:53Z"
  },
  {
    "id": 423,
    "parent_run_id": "ecfd379c6d20a8f7",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 649,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:53Z"
  },
  {
    "id": 424,
    "parent_run_id": "233e710412fc4d72",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 591,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:54Z"
  },
  {
    "id": 425,
    "parent_run_id": "233e710412fc4d72",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2045,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-03T05:01:56Z"
  },
  {
    "id": 426,
    "parent_run_id": "233e710412fc4d72",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 413,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:56Z"
  },
  {
    "id": 427,
    "parent_run_id": "6a92b9cf2d1e6b76",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 557,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-03T05:01:57Z"
  },
  {
    "id": 428,
    "parent_run_id": "8779fbed46a6517c",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 779,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-03T05:01:58Z"
  },
  {
    "id": 429,
    "parent_run_id": "1d4c31254469ca10",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 651,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:01:58Z"
  },
  {
    "id": 430,
    "parent_run_id": "edfb7921e1c94a2e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 733,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-03T05:01:59Z"
  },
  {
    "id": 431,
    "parent_run_id": "fbdc14aecea9a5a2",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 872,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-03T05:02:00Z"
  },
  {
    "id": 432,
    "parent_run_id": "493224dc4f8830b9",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 680,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-03T05:02:01Z"
  },
  {
    "id": 433,
    "parent_run_id": "c3c1a8aec3c1fce7",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1508,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:35Z"
  },
  {
    "id": 434,
    "parent_run_id": "c3c1a8aec3c1fce7",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1055,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:37Z"
  },
  {
    "id": 435,
    "parent_run_id": "c3c1a8aec3c1fce7",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 580,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:37Z"
  },
  {
    "id": 436,
    "parent_run_id": "fea78e7b8d058865",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 673,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:38Z"
  },
  {
    "id": 437,
    "parent_run_id": "fea78e7b8d058865",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1422,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:39Z"
  },
  {
    "id": 438,
    "parent_run_id": "fea78e7b8d058865",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1219,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:40Z"
  },
  {
    "id": 439,
    "parent_run_id": "66b1af4f1517e878",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 748,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:41Z"
  },
  {
    "id": 440,
    "parent_run_id": "66b1af4f1517e878",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2399,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-04T05:01:44Z"
  },
  {
    "id": 441,
    "parent_run_id": "66b1af4f1517e878",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1837,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:45Z"
  },
  {
    "id": 442,
    "parent_run_id": "345cab077f770405",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1118,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-04T05:01:47Z"
  },
  {
    "id": 443,
    "parent_run_id": "36498ba563fbc347",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 678,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-04T05:01:47Z"
  },
  {
    "id": 444,
    "parent_run_id": "0b0a23a9edf0a4ca",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 549,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:48Z"
  },
  {
    "id": 445,
    "parent_run_id": "1516ec6bc1db288d",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 637,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:48Z"
  },
  {
    "id": 446,
    "parent_run_id": "1516ec6bc1db288d",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 792,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:49Z"
  },
  {
    "id": 447,
    "parent_run_id": "1516ec6bc1db288d",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 844,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:50Z"
  },
  {
    "id": 448,
    "parent_run_id": "a13000c61ac2d2b5",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 648,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:51Z"
  },
  {
    "id": 449,
    "parent_run_id": "a13000c61ac2d2b5",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 774,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:52Z"
  },
  {
    "id": 450,
    "parent_run_id": "a13000c61ac2d2b5",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 853,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:52Z"
  },
  {
    "id": 451,
    "parent_run_id": "0898dd58ae520395",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 690,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:53Z"
  },
  {
    "id": 452,
    "parent_run_id": "0898dd58ae520395",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 611,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-04T05:01:54Z"
  },
  {
    "id": 453,
    "parent_run_id": "0898dd58ae520395",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 860,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:55Z"
  },
  {
    "id": 454,
    "parent_run_id": "923e666ee11f07df",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 722,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:55Z"
  },
  {
    "id": 455,
    "parent_run_id": "923e666ee11f07df",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 788,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:56Z"
  },
  {
    "id": 456,
    "parent_run_id": "923e666ee11f07df",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 466,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:57Z"
  },
  {
    "id": 457,
    "parent_run_id": "af838ab93aa3d044",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 628,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:57Z"
  },
  {
    "id": 458,
    "parent_run_id": "af838ab93aa3d044",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1099,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:58Z"
  },
  {
    "id": 459,
    "parent_run_id": "af838ab93aa3d044",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 483,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:59Z"
  },
  {
    "id": 460,
    "parent_run_id": "a6b912ef230396a6",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 661,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:01:59Z"
  },
  {
    "id": 461,
    "parent_run_id": "a6b912ef230396a6",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 590,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-04T05:02:00Z"
  },
  {
    "id": 462,
    "parent_run_id": "a6b912ef230396a6",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 445,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:01Z"
  },
  {
    "id": 463,
    "parent_run_id": "153bf64b2719607c",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 849,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:01Z"
  },
  {
    "id": 464,
    "parent_run_id": "153bf64b2719607c",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1226,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:03Z"
  },
  {
    "id": 465,
    "parent_run_id": "153bf64b2719607c",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 364,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:03Z"
  },
  {
    "id": 466,
    "parent_run_id": "ae24ae06526fd053",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 715,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:04Z"
  },
  {
    "id": 467,
    "parent_run_id": "ae24ae06526fd053",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1452,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:05Z"
  },
  {
    "id": 468,
    "parent_run_id": "ae24ae06526fd053",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 871,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:06Z"
  },
  {
    "id": 469,
    "parent_run_id": "4958ea3abb1ca1d8",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 566,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:07Z"
  },
  {
    "id": 470,
    "parent_run_id": "4958ea3abb1ca1d8",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2621,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-04T05:02:09Z"
  },
  {
    "id": 471,
    "parent_run_id": "4958ea3abb1ca1d8",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1200,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:10Z"
  },
  {
    "id": 472,
    "parent_run_id": "d49733b20cfad736",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 515,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:11Z"
  },
  {
    "id": 473,
    "parent_run_id": "d49733b20cfad736",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 648,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:12Z"
  },
  {
    "id": 474,
    "parent_run_id": "d49733b20cfad736",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 354,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:12Z"
  },
  {
    "id": 475,
    "parent_run_id": "4fde0349fdf3092e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 467,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:12Z"
  },
  {
    "id": 476,
    "parent_run_id": "4fde0349fdf3092e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1228,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:14Z"
  },
  {
    "id": 477,
    "parent_run_id": "4fde0349fdf3092e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 632,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:14Z"
  },
  {
    "id": 478,
    "parent_run_id": "07db12f072c00b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 700,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:15Z"
  },
  {
    "id": 479,
    "parent_run_id": "07db12f072c00b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2253,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-04T05:02:17Z"
  },
  {
    "id": 480,
    "parent_run_id": "07db12f072c00b34",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 832,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:18Z"
  },
  {
    "id": 481,
    "parent_run_id": "ba4d41e1f477b00f",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 743,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-04T05:02:19Z"
  },
  {
    "id": 482,
    "parent_run_id": "3c556bf33f968afa",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 977,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-04T05:02:20Z"
  },
  {
    "id": 483,
    "parent_run_id": "eea52049a44500e8",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 539,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:20Z"
  },
  {
    "id": 484,
    "parent_run_id": "d8d761f3b4c91f0e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 837,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-04T05:02:21Z"
  },
  {
    "id": 485,
    "parent_run_id": "805deca8ff617394",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 849,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-04T05:02:22Z"
  },
  {
    "id": 486,
    "parent_run_id": "7f243dea0c191a78",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 677,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-04T05:02:23Z"
  },
  {
    "id": 530,
    "parent_run_id": "101dad2a4b0a6e56",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2207,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:04Z"
  },
  {
    "id": 531,
    "parent_run_id": "101dad2a4b0a6e56",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1245,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:06Z"
  },
  {
    "id": 532,
    "parent_run_id": "101dad2a4b0a6e56",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1062,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:07Z"
  },
  {
    "id": 533,
    "parent_run_id": "52e447619f3d2574",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 681,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:07Z"
  },
  {
    "id": 534,
    "parent_run_id": "52e447619f3d2574",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 957,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:08Z"
  },
  {
    "id": 535,
    "parent_run_id": "52e447619f3d2574",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 441,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:09Z"
  },
  {
    "id": 536,
    "parent_run_id": "e37fc0051818372a",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 892,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:10Z"
  },
  {
    "id": 537,
    "parent_run_id": "e37fc0051818372a",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2466,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-05T05:02:12Z"
  },
  {
    "id": 538,
    "parent_run_id": "e37fc0051818372a",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1696,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:14Z"
  },
  {
    "id": 539,
    "parent_run_id": "ec6c90078b2f3603",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 784,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:15Z"
  },
  {
    "id": 540,
    "parent_run_id": "f4724e7e2ae04f75",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 738,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:15Z"
  },
  {
    "id": 541,
    "parent_run_id": "6b8f336c753b21be",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 907,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:16Z"
  },
  {
    "id": 542,
    "parent_run_id": "d6e4d23223bfa930",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 991,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:17Z"
  },
  {
    "id": 543,
    "parent_run_id": "d6e4d23223bfa930",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 815,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:18Z"
  },
  {
    "id": 544,
    "parent_run_id": "d6e4d23223bfa930",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 646,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:19Z"
  },
  {
    "id": 545,
    "parent_run_id": "77a63bbcffa6fed4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 646,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:19Z"
  },
  {
    "id": 546,
    "parent_run_id": "77a63bbcffa6fed4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 903,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:20Z"
  },
  {
    "id": 547,
    "parent_run_id": "77a63bbcffa6fed4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 779,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:21Z"
  },
  {
    "id": 548,
    "parent_run_id": "adf1b5ac8753f176",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 634,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:22Z"
  },
  {
    "id": 549,
    "parent_run_id": "adf1b5ac8753f176",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 564,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-05T05:02:22Z"
  },
  {
    "id": 550,
    "parent_run_id": "adf1b5ac8753f176",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 444,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:23Z"
  },
  {
    "id": 551,
    "parent_run_id": "986a4e4bb4286ade",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 870,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:24Z"
  },
  {
    "id": 552,
    "parent_run_id": "986a4e4bb4286ade",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 589,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:24Z"
  },
  {
    "id": 553,
    "parent_run_id": "986a4e4bb4286ade",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 794,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:25Z"
  },
  {
    "id": 554,
    "parent_run_id": "3bf275f5634283d3",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 735,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:26Z"
  },
  {
    "id": 555,
    "parent_run_id": "3bf275f5634283d3",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 672,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:26Z"
  },
  {
    "id": 556,
    "parent_run_id": "3bf275f5634283d3",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 578,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:27Z"
  },
  {
    "id": 557,
    "parent_run_id": "4dee8a74deab21ca",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 691,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:28Z"
  },
  {
    "id": 558,
    "parent_run_id": "4dee8a74deab21ca",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 809,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-05T05:02:28Z"
  },
  {
    "id": 559,
    "parent_run_id": "4dee8a74deab21ca",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 836,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:29Z"
  },
  {
    "id": 560,
    "parent_run_id": "aae94a15127df223",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 516,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:30Z"
  },
  {
    "id": 561,
    "parent_run_id": "aae94a15127df223",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1312,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:31Z"
  },
  {
    "id": 562,
    "parent_run_id": "aae94a15127df223",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1929,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:33Z"
  },
  {
    "id": 563,
    "parent_run_id": "17ca23de2a2e66f8",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 655,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:34Z"
  },
  {
    "id": 564,
    "parent_run_id": "17ca23de2a2e66f8",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1141,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:35Z"
  },
  {
    "id": 565,
    "parent_run_id": "17ca23de2a2e66f8",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 470,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:35Z"
  },
  {
    "id": 566,
    "parent_run_id": "b21a27608805ecdc",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 753,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:36Z"
  },
  {
    "id": 567,
    "parent_run_id": "b21a27608805ecdc",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 3276,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:39Z"
  },
  {
    "id": 568,
    "parent_run_id": "b21a27608805ecdc",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1022,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:40Z"
  },
  {
    "id": 569,
    "parent_run_id": "cd1f33b4f7ec411f",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 775,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:41Z"
  },
  {
    "id": 570,
    "parent_run_id": "cd1f33b4f7ec411f",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 882,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:42Z"
  },
  {
    "id": 571,
    "parent_run_id": "cd1f33b4f7ec411f",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 529,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:43Z"
  },
  {
    "id": 572,
    "parent_run_id": "0a8d88c66cd3b914",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 541,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:43Z"
  },
  {
    "id": 573,
    "parent_run_id": "0a8d88c66cd3b914",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1460,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:45Z"
  },
  {
    "id": 574,
    "parent_run_id": "0a8d88c66cd3b914",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 608,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:45Z"
  },
  {
    "id": 575,
    "parent_run_id": "c024123b2fda33b4",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 516,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:46Z"
  },
  {
    "id": 576,
    "parent_run_id": "c024123b2fda33b4",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2402,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-05T05:02:48Z"
  },
  {
    "id": 577,
    "parent_run_id": "c024123b2fda33b4",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 568,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:49Z"
  },
  {
    "id": 578,
    "parent_run_id": "2c81aec67081b8a1",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1257,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:50Z"
  },
  {
    "id": 579,
    "parent_run_id": "bbb6a75166d6fb2b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 705,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:51Z"
  },
  {
    "id": 580,
    "parent_run_id": "d3a9a87a6eafd907",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 724,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:52Z"
  },
  {
    "id": 581,
    "parent_run_id": "523538da10626f3b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 772,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:52Z"
  },
  {
    "id": 582,
    "parent_run_id": "28e3d58e6d2c22f7",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 823,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-05T05:02:53Z"
  },
  {
    "id": 583,
    "parent_run_id": "d0e33be5e0233dcb",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 741,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-05T05:02:54Z"
  },
  {
    "id": 596,
    "parent_run_id": "656f848f7802fdcc",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1293,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:03:59Z"
  },
  {
    "id": 597,
    "parent_run_id": "656f848f7802fdcc",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1352,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:01Z"
  },
  {
    "id": 598,
    "parent_run_id": "656f848f7802fdcc",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1673,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:02Z"
  },
  {
    "id": 599,
    "parent_run_id": "e064533a105bcc73",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 852,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:03Z"
  },
  {
    "id": 600,
    "parent_run_id": "e064533a105bcc73",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1124,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:04Z"
  },
  {
    "id": 601,
    "parent_run_id": "e064533a105bcc73",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 930,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:05Z"
  },
  {
    "id": 602,
    "parent_run_id": "a330df5f5097082e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 642,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:06Z"
  },
  {
    "id": 603,
    "parent_run_id": "a330df5f5097082e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1609,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-06T05:04:08Z"
  },
  {
    "id": 604,
    "parent_run_id": "a330df5f5097082e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 379,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:08Z"
  },
  {
    "id": 605,
    "parent_run_id": "6872ba4f6841ad9c",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 775,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:09Z"
  },
  {
    "id": 606,
    "parent_run_id": "f87e7550aeed06b7",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 826,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:10Z"
  },
  {
    "id": 607,
    "parent_run_id": "dba76ef852eab36b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1665,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:11Z"
  },
  {
    "id": 608,
    "parent_run_id": "5547b2970c69aa03",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 662,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:12Z"
  },
  {
    "id": 609,
    "parent_run_id": "5547b2970c69aa03",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 801,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:13Z"
  },
  {
    "id": 610,
    "parent_run_id": "5547b2970c69aa03",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 750,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:14Z"
  },
  {
    "id": 611,
    "parent_run_id": "402407843237acb5",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 638,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:14Z"
  },
  {
    "id": 612,
    "parent_run_id": "402407843237acb5",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 622,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:15Z"
  },
  {
    "id": 613,
    "parent_run_id": "402407843237acb5",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 401,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:15Z"
  },
  {
    "id": 614,
    "parent_run_id": "97c0b9a19403d4a3",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 611,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:16Z"
  },
  {
    "id": 615,
    "parent_run_id": "97c0b9a19403d4a3",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 701,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-06T05:04:17Z"
  },
  {
    "id": 616,
    "parent_run_id": "97c0b9a19403d4a3",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 384,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:17Z"
  },
  {
    "id": 617,
    "parent_run_id": "230ff5967f9e40bc",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 623,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:18Z"
  },
  {
    "id": 618,
    "parent_run_id": "230ff5967f9e40bc",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 767,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:18Z"
  },
  {
    "id": 619,
    "parent_run_id": "230ff5967f9e40bc",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 448,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:19Z"
  },
  {
    "id": 620,
    "parent_run_id": "144ff3de8c2f0e19",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 929,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:20Z"
  },
  {
    "id": 621,
    "parent_run_id": "144ff3de8c2f0e19",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 564,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:20Z"
  },
  {
    "id": 622,
    "parent_run_id": "144ff3de8c2f0e19",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 386,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:21Z"
  },
  {
    "id": 623,
    "parent_run_id": "7d527d2453f0f8bb",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 894,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:22Z"
  },
  {
    "id": 624,
    "parent_run_id": "7d527d2453f0f8bb",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 655,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-06T05:04:22Z"
  },
  {
    "id": 625,
    "parent_run_id": "7d527d2453f0f8bb",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 771,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:23Z"
  },
  {
    "id": 626,
    "parent_run_id": "fc673e6c4ee2c8e1",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 635,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:24Z"
  },
  {
    "id": 627,
    "parent_run_id": "fc673e6c4ee2c8e1",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1086,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:25Z"
  },
  {
    "id": 628,
    "parent_run_id": "fc673e6c4ee2c8e1",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 422,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:25Z"
  },
  {
    "id": 629,
    "parent_run_id": "af3aa7a225f36e8e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 830,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:26Z"
  },
  {
    "id": 630,
    "parent_run_id": "af3aa7a225f36e8e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1103,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:27Z"
  },
  {
    "id": 631,
    "parent_run_id": "af3aa7a225f36e8e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 455,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:28Z"
  },
  {
    "id": 632,
    "parent_run_id": "dac1e16b0b7f6add",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 789,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:28Z"
  },
  {
    "id": 633,
    "parent_run_id": "dac1e16b0b7f6add",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2228,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-06T05:04:31Z"
  },
  {
    "id": 634,
    "parent_run_id": "dac1e16b0b7f6add",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 399,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:31Z"
  },
  {
    "id": 635,
    "parent_run_id": "7a130e52a8d1101d",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 638,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:32Z"
  },
  {
    "id": 636,
    "parent_run_id": "7a130e52a8d1101d",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 889,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:33Z"
  },
  {
    "id": 637,
    "parent_run_id": "7a130e52a8d1101d",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 502,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:33Z"
  },
  {
    "id": 638,
    "parent_run_id": "6a7d16a84ce48fa7",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 613,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:34Z"
  },
  {
    "id": 639,
    "parent_run_id": "6a7d16a84ce48fa7",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1933,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:36Z"
  },
  {
    "id": 640,
    "parent_run_id": "6a7d16a84ce48fa7",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1806,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:37Z"
  },
  {
    "id": 641,
    "parent_run_id": "bc8aef7ea797e824",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 639,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:38Z"
  },
  {
    "id": 642,
    "parent_run_id": "bc8aef7ea797e824",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2153,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-06T05:04:40Z"
  },
  {
    "id": 643,
    "parent_run_id": "bc8aef7ea797e824",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 785,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:41Z"
  },
  {
    "id": 644,
    "parent_run_id": "5ec8ef75570d2948",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 841,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:42Z"
  },
  {
    "id": 645,
    "parent_run_id": "df0218f7349a6dd7",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 819,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:43Z"
  },
  {
    "id": 646,
    "parent_run_id": "c465b919b3e345e5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 663,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:43Z"
  },
  {
    "id": 647,
    "parent_run_id": "e1367e4bebbe2685",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 760,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:44Z"
  },
  {
    "id": 648,
    "parent_run_id": "d0443754612aa1fd",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 977,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-06T05:04:45Z"
  },
  {
    "id": 649,
    "parent_run_id": "5d4683fc121d2f92",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 833,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-06T05:04:46Z"
  },
  {
    "id": 653,
    "parent_run_id": "b23fb6ea5ef5bf42",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1488,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:26Z"
  },
  {
    "id": 654,
    "parent_run_id": "b23fb6ea5ef5bf42",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 632,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:27Z"
  },
  {
    "id": 655,
    "parent_run_id": "b23fb6ea5ef5bf42",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1834,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:28Z"
  },
  {
    "id": 656,
    "parent_run_id": "7d7053fff66c0ecf",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 776,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:29Z"
  },
  {
    "id": 657,
    "parent_run_id": "7d7053fff66c0ecf",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1091,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:30Z"
  },
  {
    "id": 658,
    "parent_run_id": "7d7053fff66c0ecf",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 571,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:31Z"
  },
  {
    "id": 659,
    "parent_run_id": "cccf378c12505681",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 661,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:32Z"
  },
  {
    "id": 660,
    "parent_run_id": "cccf378c12505681",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2483,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-07T05:04:34Z"
  },
  {
    "id": 661,
    "parent_run_id": "cccf378c12505681",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 473,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:35Z"
  },
  {
    "id": 662,
    "parent_run_id": "37ee1d4beb6cbe42",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 835,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-07T05:04:35Z"
  },
  {
    "id": 663,
    "parent_run_id": "10aaf4320b90d09b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 681,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-07T05:04:36Z"
  },
  {
    "id": 664,
    "parent_run_id": "ab53bc9b50b3eeee",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 701,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:37Z"
  },
  {
    "id": 665,
    "parent_run_id": "c66ef0e298205d03",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 660,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:37Z"
  },
  {
    "id": 666,
    "parent_run_id": "c66ef0e298205d03",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1055,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:38Z"
  },
  {
    "id": 667,
    "parent_run_id": "c66ef0e298205d03",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 457,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:39Z"
  },
  {
    "id": 668,
    "parent_run_id": "ce750f977a0b1e87",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 839,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:40Z"
  },
  {
    "id": 669,
    "parent_run_id": "ce750f977a0b1e87",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 888,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:41Z"
  },
  {
    "id": 670,
    "parent_run_id": "ce750f977a0b1e87",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 864,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:42Z"
  },
  {
    "id": 671,
    "parent_run_id": "04476896abf2cbd3",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 683,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:42Z"
  },
  {
    "id": 672,
    "parent_run_id": "04476896abf2cbd3",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 604,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-07T05:04:43Z"
  },
  {
    "id": 673,
    "parent_run_id": "04476896abf2cbd3",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 757,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:44Z"
  },
  {
    "id": 674,
    "parent_run_id": "0dbb9b94f19a3160",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 652,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:44Z"
  },
  {
    "id": 675,
    "parent_run_id": "0dbb9b94f19a3160",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 638,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:45Z"
  },
  {
    "id": 676,
    "parent_run_id": "0dbb9b94f19a3160",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 649,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:46Z"
  },
  {
    "id": 677,
    "parent_run_id": "d63e5f3b03884c21",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1311,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:47Z"
  },
  {
    "id": 678,
    "parent_run_id": "d63e5f3b03884c21",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 983,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:48Z"
  },
  {
    "id": 679,
    "parent_run_id": "d63e5f3b03884c21",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 699,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:49Z"
  },
  {
    "id": 680,
    "parent_run_id": "e28a7359484c5fea",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 674,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:49Z"
  },
  {
    "id": 681,
    "parent_run_id": "e28a7359484c5fea",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 742,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-07T05:04:50Z"
  },
  {
    "id": 682,
    "parent_run_id": "e28a7359484c5fea",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 808,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:51Z"
  },
  {
    "id": 683,
    "parent_run_id": "4877dee45ff959e8",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 771,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:52Z"
  },
  {
    "id": 684,
    "parent_run_id": "4877dee45ff959e8",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1571,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:53Z"
  },
  {
    "id": 685,
    "parent_run_id": "4877dee45ff959e8",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 969,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:54Z"
  },
  {
    "id": 686,
    "parent_run_id": "da768ced46a8ade6",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 669,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:55Z"
  },
  {
    "id": 687,
    "parent_run_id": "da768ced46a8ade6",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1259,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:56Z"
  },
  {
    "id": 688,
    "parent_run_id": "da768ced46a8ade6",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 526,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:57Z"
  },
  {
    "id": 689,
    "parent_run_id": "59621747814f5902",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 645,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 4.75e-06,
    "error": null,
    "created_at": "2026-05-07T05:04:57Z"
  },
  {
    "id": 690,
    "parent_run_id": "59621747814f5902",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2360,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-07T05:05:00Z"
  },
  {
    "id": 691,
    "parent_run_id": "59621747814f5902",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 974,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:01Z"
  },
  {
    "id": 692,
    "parent_run_id": "bfbced0c371d081e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 795,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:01Z"
  },
  {
    "id": 693,
    "parent_run_id": "bfbced0c371d081e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 738,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:02Z"
  },
  {
    "id": 694,
    "parent_run_id": "bfbced0c371d081e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 892,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:03Z"
  },
  {
    "id": 695,
    "parent_run_id": "aec50dc82dcb2ff2",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 772,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:04Z"
  },
  {
    "id": 696,
    "parent_run_id": "aec50dc82dcb2ff2",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1943,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:06Z"
  },
  {
    "id": 697,
    "parent_run_id": "aec50dc82dcb2ff2",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 687,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:07Z"
  },
  {
    "id": 698,
    "parent_run_id": "6e1ce94881136be3",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 879,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:07Z"
  },
  {
    "id": 699,
    "parent_run_id": "6e1ce94881136be3",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2175,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-07T05:05:10Z"
  },
  {
    "id": 700,
    "parent_run_id": "6e1ce94881136be3",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 608,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:10Z"
  },
  {
    "id": 701,
    "parent_run_id": "1b981dce399857d3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 795,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-07T05:05:11Z"
  },
  {
    "id": 702,
    "parent_run_id": "4089bf3c0f979bcc",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 698,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-07T05:05:12Z"
  },
  {
    "id": 703,
    "parent_run_id": "06783117002f643c",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 714,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:12Z"
  },
  {
    "id": 704,
    "parent_run_id": "8b9f0fd9b41eaf5b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 729,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-07T05:05:13Z"
  },
  {
    "id": 705,
    "parent_run_id": "64672631f9118eaa",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 717,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-07T05:05:14Z"
  },
  {
    "id": 706,
    "parent_run_id": "b0f65a11a8d36581",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 711,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-07T05:05:15Z"
  },
  {
    "id": 708,
    "parent_run_id": "c2ccddd55d8869af",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1541,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:18Z"
  },
  {
    "id": 709,
    "parent_run_id": "c2ccddd55d8869af",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 868,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:19Z"
  },
  {
    "id": 710,
    "parent_run_id": "c2ccddd55d8869af",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 3660,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:22Z"
  },
  {
    "id": 711,
    "parent_run_id": "c17c0c9b2622b3c9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 676,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:23Z"
  },
  {
    "id": 712,
    "parent_run_id": "c17c0c9b2622b3c9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 905,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:24Z"
  },
  {
    "id": 713,
    "parent_run_id": "c17c0c9b2622b3c9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 566,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:25Z"
  },
  {
    "id": 714,
    "parent_run_id": "06420d6e72ec12ec",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 606,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:25Z"
  },
  {
    "id": 715,
    "parent_run_id": "06420d6e72ec12ec",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2209,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-08T05:00:27Z"
  },
  {
    "id": 716,
    "parent_run_id": "06420d6e72ec12ec",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1343,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:29Z"
  },
  {
    "id": 717,
    "parent_run_id": "b65476cc9aea3028",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 763,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-08T05:00:30Z"
  },
  {
    "id": 718,
    "parent_run_id": "046240bff7e3045d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 690,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-08T05:00:30Z"
  },
  {
    "id": 719,
    "parent_run_id": "693beb7f2a21a9db",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 613,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:31Z"
  },
  {
    "id": 720,
    "parent_run_id": "ac262ba2a0c0dde0",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 646,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:32Z"
  },
  {
    "id": 721,
    "parent_run_id": "ac262ba2a0c0dde0",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 889,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:32Z"
  },
  {
    "id": 722,
    "parent_run_id": "ac262ba2a0c0dde0",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1066,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:33Z"
  },
  {
    "id": 723,
    "parent_run_id": "bd2ef639e253c4d7",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 594,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:34Z"
  },
  {
    "id": 724,
    "parent_run_id": "bd2ef639e253c4d7",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1110,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:35Z"
  },
  {
    "id": 725,
    "parent_run_id": "bd2ef639e253c4d7",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 523,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:36Z"
  },
  {
    "id": 726,
    "parent_run_id": "ed7f83fb06722847",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 598,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:36Z"
  },
  {
    "id": 727,
    "parent_run_id": "ed7f83fb06722847",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 965,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-08T05:00:37Z"
  },
  {
    "id": 728,
    "parent_run_id": "ed7f83fb06722847",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 2049,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:39Z"
  },
  {
    "id": 729,
    "parent_run_id": "9b96a189cccfde73",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 788,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:40Z"
  },
  {
    "id": 730,
    "parent_run_id": "9b96a189cccfde73",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 742,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:41Z"
  },
  {
    "id": 731,
    "parent_run_id": "9b96a189cccfde73",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 790,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:42Z"
  },
  {
    "id": 732,
    "parent_run_id": "c65c10c1a24dfff9",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 624,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:42Z"
  },
  {
    "id": 733,
    "parent_run_id": "c65c10c1a24dfff9",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 2057,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:44Z"
  },
  {
    "id": 734,
    "parent_run_id": "c65c10c1a24dfff9",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1063,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:45Z"
  },
  {
    "id": 735,
    "parent_run_id": "7c8d859bec878e06",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 623,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:46Z"
  },
  {
    "id": 736,
    "parent_run_id": "7c8d859bec878e06",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 927,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-08T05:00:47Z"
  },
  {
    "id": 737,
    "parent_run_id": "7c8d859bec878e06",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 711,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:48Z"
  },
  {
    "id": 738,
    "parent_run_id": "c4ad8e2583fea550",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 778,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:49Z"
  },
  {
    "id": 739,
    "parent_run_id": "c4ad8e2583fea550",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1113,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:50Z"
  },
  {
    "id": 740,
    "parent_run_id": "c4ad8e2583fea550",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2043,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:52Z"
  },
  {
    "id": 741,
    "parent_run_id": "9d33be8d5591bd25",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 649,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:52Z"
  },
  {
    "id": 742,
    "parent_run_id": "9d33be8d5591bd25",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 872,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:53Z"
  },
  {
    "id": 743,
    "parent_run_id": "9d33be8d5591bd25",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1044,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:54Z"
  },
  {
    "id": 744,
    "parent_run_id": "4782c16287865e37",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 668,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:55Z"
  },
  {
    "id": 745,
    "parent_run_id": "4782c16287865e37",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2262,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-08T05:00:57Z"
  },
  {
    "id": 746,
    "parent_run_id": "4782c16287865e37",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 945,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:58Z"
  },
  {
    "id": 747,
    "parent_run_id": "5d08f0d769b04ee8",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 612,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:00:59Z"
  },
  {
    "id": 748,
    "parent_run_id": "5d08f0d769b04ee8",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1270,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:00Z"
  },
  {
    "id": 749,
    "parent_run_id": "5d08f0d769b04ee8",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1396,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:01Z"
  },
  {
    "id": 750,
    "parent_run_id": "cf2d6994dcb90c0f",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 617,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:02Z"
  },
  {
    "id": 751,
    "parent_run_id": "cf2d6994dcb90c0f",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1003,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:03Z"
  },
  {
    "id": 752,
    "parent_run_id": "cf2d6994dcb90c0f",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 844,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:04Z"
  },
  {
    "id": 753,
    "parent_run_id": "e3e77e1578545682",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 615,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:05Z"
  },
  {
    "id": 754,
    "parent_run_id": "e3e77e1578545682",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2122,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-08T05:01:07Z"
  },
  {
    "id": 755,
    "parent_run_id": "e3e77e1578545682",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 522,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:07Z"
  },
  {
    "id": 756,
    "parent_run_id": "375bfc0eefde874e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 722,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-08T05:01:08Z"
  },
  {
    "id": 757,
    "parent_run_id": "762038fcff7a56b7",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 675,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-08T05:01:09Z"
  },
  {
    "id": 758,
    "parent_run_id": "8c960c99042e947d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 636,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:09Z"
  },
  {
    "id": 759,
    "parent_run_id": "cb3eb7fdf4a43f71",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1341,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-08T05:01:11Z"
  },
  {
    "id": 760,
    "parent_run_id": "fa11fd352f754c1a",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 786,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-08T05:01:11Z"
  },
  {
    "id": 761,
    "parent_run_id": "f6d45c002eef9ae0",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 659,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-08T05:01:12Z"
  },
  {
    "id": 763,
    "parent_run_id": "aafab3c42313ff19",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1670,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:17Z"
  },
  {
    "id": 764,
    "parent_run_id": "aafab3c42313ff19",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1173,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:18Z"
  },
  {
    "id": 765,
    "parent_run_id": "aafab3c42313ff19",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 778,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:19Z"
  },
  {
    "id": 766,
    "parent_run_id": "64a0aa0158eb6527",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 798,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:20Z"
  },
  {
    "id": 767,
    "parent_run_id": "64a0aa0158eb6527",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1271,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:21Z"
  },
  {
    "id": 768,
    "parent_run_id": "64a0aa0158eb6527",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 2018,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:23Z"
  },
  {
    "id": 769,
    "parent_run_id": "c52aac67ea9920b1",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1298,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:24Z"
  },
  {
    "id": 770,
    "parent_run_id": "c52aac67ea9920b1",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2292,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-09T05:03:27Z"
  },
  {
    "id": 771,
    "parent_run_id": "c52aac67ea9920b1",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 914,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:28Z"
  },
  {
    "id": 772,
    "parent_run_id": "9e4ed8b730537870",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1278,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-09T05:03:29Z"
  },
  {
    "id": 773,
    "parent_run_id": "78512cd3997159ad",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1586,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-09T05:03:30Z"
  },
  {
    "id": 774,
    "parent_run_id": "96d7344b15892b2d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 663,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:31Z"
  },
  {
    "id": 775,
    "parent_run_id": "4686e1f1de62e44f",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 686,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:32Z"
  },
  {
    "id": 776,
    "parent_run_id": "4686e1f1de62e44f",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 717,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:33Z"
  },
  {
    "id": 777,
    "parent_run_id": "4686e1f1de62e44f",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 736,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:33Z"
  },
  {
    "id": 778,
    "parent_run_id": "0749e122b44b451c",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 785,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:34Z"
  },
  {
    "id": 779,
    "parent_run_id": "0749e122b44b451c",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 666,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:35Z"
  },
  {
    "id": 780,
    "parent_run_id": "0749e122b44b451c",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1793,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:37Z"
  },
  {
    "id": 781,
    "parent_run_id": "07c0a3bb57867582",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 680,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:37Z"
  },
  {
    "id": 782,
    "parent_run_id": "07c0a3bb57867582",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 578,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-09T05:03:38Z"
  },
  {
    "id": 783,
    "parent_run_id": "07c0a3bb57867582",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 555,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:38Z"
  },
  {
    "id": 784,
    "parent_run_id": "de371a21f9818771",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 652,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:39Z"
  },
  {
    "id": 785,
    "parent_run_id": "de371a21f9818771",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 721,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:40Z"
  },
  {
    "id": 786,
    "parent_run_id": "de371a21f9818771",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 722,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:40Z"
  },
  {
    "id": 787,
    "parent_run_id": "0dd6fae03dd5a412",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1102,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:42Z"
  },
  {
    "id": 788,
    "parent_run_id": "0dd6fae03dd5a412",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 720,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:42Z"
  },
  {
    "id": 789,
    "parent_run_id": "0dd6fae03dd5a412",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 532,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:43Z"
  },
  {
    "id": 790,
    "parent_run_id": "9271d0ed4dd064f7",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1036,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:44Z"
  },
  {
    "id": 791,
    "parent_run_id": "9271d0ed4dd064f7",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 711,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-09T05:03:45Z"
  },
  {
    "id": 792,
    "parent_run_id": "9271d0ed4dd064f7",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 946,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:46Z"
  },
  {
    "id": 793,
    "parent_run_id": "a2ce02a02ca34a17",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 923,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:46Z"
  },
  {
    "id": 794,
    "parent_run_id": "a2ce02a02ca34a17",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1430,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:48Z"
  },
  {
    "id": 795,
    "parent_run_id": "a2ce02a02ca34a17",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 480,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:48Z"
  },
  {
    "id": 796,
    "parent_run_id": "9f585d6ffae97b78",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 827,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:49Z"
  },
  {
    "id": 797,
    "parent_run_id": "9f585d6ffae97b78",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1279,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:51Z"
  },
  {
    "id": 798,
    "parent_run_id": "9f585d6ffae97b78",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 557,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:51Z"
  },
  {
    "id": 799,
    "parent_run_id": "d332f066444833db",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 606,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:52Z"
  },
  {
    "id": 800,
    "parent_run_id": "d332f066444833db",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2079,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-09T05:03:54Z"
  },
  {
    "id": 801,
    "parent_run_id": "d332f066444833db",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 847,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:55Z"
  },
  {
    "id": 802,
    "parent_run_id": "679dba45daa8c116",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 888,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:56Z"
  },
  {
    "id": 803,
    "parent_run_id": "679dba45daa8c116",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 622,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:56Z"
  },
  {
    "id": 804,
    "parent_run_id": "679dba45daa8c116",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 487,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:57Z"
  },
  {
    "id": 805,
    "parent_run_id": "75f29641a4261600",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 709,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:57Z"
  },
  {
    "id": 806,
    "parent_run_id": "75f29641a4261600",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1334,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:59Z"
  },
  {
    "id": 807,
    "parent_run_id": "75f29641a4261600",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 570,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-09T05:03:59Z"
  },
  {
    "id": 808,
    "parent_run_id": "3adef3a855801596",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 732,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:04:00Z"
  },
  {
    "id": 809,
    "parent_run_id": "3adef3a855801596",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 3112,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-09T05:04:03Z"
  },
  {
    "id": 810,
    "parent_run_id": "3adef3a855801596",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 599,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-09T05:04:04Z"
  },
  {
    "id": 811,
    "parent_run_id": "d9907e7bed558478",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 716,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-09T05:04:04Z"
  },
  {
    "id": 812,
    "parent_run_id": "cc1b32f177cb2213",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 694,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-09T05:04:05Z"
  },
  {
    "id": 813,
    "parent_run_id": "82ee0107488c9a9f",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 920,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:04:06Z"
  },
  {
    "id": 814,
    "parent_run_id": "c997aeeca36bd566",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 784,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-09T05:04:07Z"
  },
  {
    "id": 815,
    "parent_run_id": "8b6d8d889e17558e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 784,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-09T05:04:08Z"
  },
  {
    "id": 816,
    "parent_run_id": "c3edffeb9e571994",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 740,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-09T05:04:08Z"
  },
  {
    "id": 818,
    "parent_run_id": "6a914f9d8cca88e6",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1369,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:01Z"
  },
  {
    "id": 819,
    "parent_run_id": "6a914f9d8cca88e6",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 758,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:02Z"
  },
  {
    "id": 820,
    "parent_run_id": "6a914f9d8cca88e6",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1006,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:03Z"
  },
  {
    "id": 821,
    "parent_run_id": "a352c75767bc39cb",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1305,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:04Z"
  },
  {
    "id": 822,
    "parent_run_id": "a352c75767bc39cb",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 643,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:05Z"
  },
  {
    "id": 823,
    "parent_run_id": "a352c75767bc39cb",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 420,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:05Z"
  },
  {
    "id": 824,
    "parent_run_id": "59b0be8c21d919d0",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 703,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:06Z"
  },
  {
    "id": 825,
    "parent_run_id": "59b0be8c21d919d0",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2294,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-10T05:03:08Z"
  },
  {
    "id": 826,
    "parent_run_id": "59b0be8c21d919d0",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2687,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:11Z"
  },
  {
    "id": 827,
    "parent_run_id": "69c54d6216ef4f4d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 747,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:11Z"
  },
  {
    "id": 828,
    "parent_run_id": "77c723c96163d2c3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 654,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:12Z"
  },
  {
    "id": 829,
    "parent_run_id": "7dc85c8f173fb5bc",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 750,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:13Z"
  },
  {
    "id": 830,
    "parent_run_id": "bab84406919424ee",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 657,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:13Z"
  },
  {
    "id": 831,
    "parent_run_id": "bab84406919424ee",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 557,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:14Z"
  },
  {
    "id": 832,
    "parent_run_id": "bab84406919424ee",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1187,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:15Z"
  },
  {
    "id": 833,
    "parent_run_id": "b8204a65909500cd",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 611,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:16Z"
  },
  {
    "id": 834,
    "parent_run_id": "b8204a65909500cd",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 662,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:17Z"
  },
  {
    "id": 835,
    "parent_run_id": "b8204a65909500cd",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 605,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:17Z"
  },
  {
    "id": 836,
    "parent_run_id": "6527c6c7ebd1dccf",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 610,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:18Z"
  },
  {
    "id": 837,
    "parent_run_id": "6527c6c7ebd1dccf",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1470,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-10T05:03:19Z"
  },
  {
    "id": 838,
    "parent_run_id": "6527c6c7ebd1dccf",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 880,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:20Z"
  },
  {
    "id": 839,
    "parent_run_id": "748f34e901ae4e42",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 595,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:21Z"
  },
  {
    "id": 840,
    "parent_run_id": "748f34e901ae4e42",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 530,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:21Z"
  },
  {
    "id": 841,
    "parent_run_id": "748f34e901ae4e42",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 797,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:22Z"
  },
  {
    "id": 842,
    "parent_run_id": "b1ced658b3ae8b45",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1268,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:23Z"
  },
  {
    "id": 843,
    "parent_run_id": "b1ced658b3ae8b45",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 616,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:24Z"
  },
  {
    "id": 844,
    "parent_run_id": "b1ced658b3ae8b45",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 866,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:25Z"
  },
  {
    "id": 845,
    "parent_run_id": "8ad5bd4453b3439b",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 634,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:25Z"
  },
  {
    "id": 846,
    "parent_run_id": "8ad5bd4453b3439b",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1960,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-10T05:03:27Z"
  },
  {
    "id": 847,
    "parent_run_id": "8ad5bd4453b3439b",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 399,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:28Z"
  },
  {
    "id": 848,
    "parent_run_id": "1a1cb93efc3c6727",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 658,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:28Z"
  },
  {
    "id": 849,
    "parent_run_id": "1a1cb93efc3c6727",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1068,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:30Z"
  },
  {
    "id": 850,
    "parent_run_id": "1a1cb93efc3c6727",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 605,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:30Z"
  },
  {
    "id": 851,
    "parent_run_id": "9611c8f8b823d318",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 630,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:31Z"
  },
  {
    "id": 852,
    "parent_run_id": "9611c8f8b823d318",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 648,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:31Z"
  },
  {
    "id": 853,
    "parent_run_id": "9611c8f8b823d318",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 498,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:32Z"
  },
  {
    "id": 854,
    "parent_run_id": "a60619d58120c816",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 611,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:33Z"
  },
  {
    "id": 855,
    "parent_run_id": "a60619d58120c816",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2218,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-10T05:03:35Z"
  },
  {
    "id": 856,
    "parent_run_id": "a60619d58120c816",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1332,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:36Z"
  },
  {
    "id": 857,
    "parent_run_id": "4a8d4996d6c0cff0",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 768,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:37Z"
  },
  {
    "id": 858,
    "parent_run_id": "4a8d4996d6c0cff0",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1062,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:38Z"
  },
  {
    "id": 859,
    "parent_run_id": "4a8d4996d6c0cff0",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1082,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:39Z"
  },
  {
    "id": 860,
    "parent_run_id": "fbfde6b8b396f919",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 739,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:40Z"
  },
  {
    "id": 861,
    "parent_run_id": "fbfde6b8b396f919",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1067,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:41Z"
  },
  {
    "id": 862,
    "parent_run_id": "fbfde6b8b396f919",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 568,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:41Z"
  },
  {
    "id": 863,
    "parent_run_id": "ff6b74d6dbaeb2ca",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 608,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:42Z"
  },
  {
    "id": 864,
    "parent_run_id": "ff6b74d6dbaeb2ca",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2202,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-10T05:03:44Z"
  },
  {
    "id": 865,
    "parent_run_id": "ff6b74d6dbaeb2ca",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1261,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:46Z"
  },
  {
    "id": 866,
    "parent_run_id": "099e67b1e4d567d6",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 781,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:46Z"
  },
  {
    "id": 867,
    "parent_run_id": "c6b2d0480f4555ac",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 2604,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:49Z"
  },
  {
    "id": 868,
    "parent_run_id": "58bebf714fc488a8",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1238,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:50Z"
  },
  {
    "id": 869,
    "parent_run_id": "a227e0ac170f6c2f",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 714,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:51Z"
  },
  {
    "id": 870,
    "parent_run_id": "669f6e3d58bfd019",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 690,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-10T05:03:52Z"
  },
  {
    "id": 871,
    "parent_run_id": "8880360844921eda",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1147,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-10T05:03:53Z"
  },
  {
    "id": 878,
    "parent_run_id": "8feee85ac427c5f3",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2035,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:43Z"
  },
  {
    "id": 879,
    "parent_run_id": "8feee85ac427c5f3",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 939,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:44Z"
  },
  {
    "id": 880,
    "parent_run_id": "8feee85ac427c5f3",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1154,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:45Z"
  },
  {
    "id": 881,
    "parent_run_id": "ff59938cbe27aead",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 859,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:46Z"
  },
  {
    "id": 882,
    "parent_run_id": "ff59938cbe27aead",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1199,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:47Z"
  },
  {
    "id": 883,
    "parent_run_id": "ff59938cbe27aead",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 830,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:48Z"
  },
  {
    "id": 884,
    "parent_run_id": "7f8e99a52556948e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 752,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:48Z"
  },
  {
    "id": 885,
    "parent_run_id": "7f8e99a52556948e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2664,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-11T05:02:51Z"
  },
  {
    "id": 886,
    "parent_run_id": "7f8e99a52556948e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2126,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:53Z"
  },
  {
    "id": 887,
    "parent_run_id": "80c37939ba9c927a",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 905,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-11T05:02:54Z"
  },
  {
    "id": 888,
    "parent_run_id": "4bfe240f29d1e486",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 914,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-11T05:02:55Z"
  },
  {
    "id": 889,
    "parent_run_id": "e38d0949cccfe3b0",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 668,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:56Z"
  },
  {
    "id": 890,
    "parent_run_id": "406f210794807560",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 732,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:57Z"
  },
  {
    "id": 891,
    "parent_run_id": "406f210794807560",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 634,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:57Z"
  },
  {
    "id": 892,
    "parent_run_id": "406f210794807560",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1074,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:58Z"
  },
  {
    "id": 893,
    "parent_run_id": "520dd61766d2b7e9",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 703,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-11T05:02:59Z"
  },
  {
    "id": 894,
    "parent_run_id": "520dd61766d2b7e9",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 627,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:00Z"
  },
  {
    "id": 895,
    "parent_run_id": "520dd61766d2b7e9",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1892,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:01Z"
  },
  {
    "id": 896,
    "parent_run_id": "7bb5abe1bf1cd4b4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 869,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:02Z"
  },
  {
    "id": 897,
    "parent_run_id": "7bb5abe1bf1cd4b4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 931,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-11T05:03:03Z"
  },
  {
    "id": 898,
    "parent_run_id": "7bb5abe1bf1cd4b4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1214,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:05Z"
  },
  {
    "id": 899,
    "parent_run_id": "e10de88337ff32e4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 606,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:05Z"
  },
  {
    "id": 900,
    "parent_run_id": "e10de88337ff32e4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 577,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:06Z"
  },
  {
    "id": 901,
    "parent_run_id": "e10de88337ff32e4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 743,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:06Z"
  },
  {
    "id": 902,
    "parent_run_id": "12fe85eb1a201abc",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 685,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:07Z"
  },
  {
    "id": 903,
    "parent_run_id": "12fe85eb1a201abc",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1108,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:08Z"
  },
  {
    "id": 904,
    "parent_run_id": "12fe85eb1a201abc",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 959,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:09Z"
  },
  {
    "id": 905,
    "parent_run_id": "c5934461e9839235",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 609,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:10Z"
  },
  {
    "id": 906,
    "parent_run_id": "c5934461e9839235",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 709,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-11T05:03:11Z"
  },
  {
    "id": 907,
    "parent_run_id": "c5934461e9839235",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 582,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:11Z"
  },
  {
    "id": 908,
    "parent_run_id": "28e332c76a96e823",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 649,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:12Z"
  },
  {
    "id": 909,
    "parent_run_id": "28e332c76a96e823",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 661,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:12Z"
  },
  {
    "id": 910,
    "parent_run_id": "28e332c76a96e823",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1017,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:13Z"
  },
  {
    "id": 911,
    "parent_run_id": "019fa7e2e6d9de97",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 662,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:14Z"
  },
  {
    "id": 912,
    "parent_run_id": "019fa7e2e6d9de97",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1062,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:15Z"
  },
  {
    "id": 913,
    "parent_run_id": "019fa7e2e6d9de97",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 568,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:16Z"
  },
  {
    "id": 914,
    "parent_run_id": "fbb460fed7ae46df",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 717,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:17Z"
  },
  {
    "id": 915,
    "parent_run_id": "fbb460fed7ae46df",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2444,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-11T05:03:19Z"
  },
  {
    "id": 916,
    "parent_run_id": "fbb460fed7ae46df",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 667,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:20Z"
  },
  {
    "id": 917,
    "parent_run_id": "0cb34a080c965662",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 729,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:20Z"
  },
  {
    "id": 918,
    "parent_run_id": "0cb34a080c965662",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 953,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:21Z"
  },
  {
    "id": 919,
    "parent_run_id": "0cb34a080c965662",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 634,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:22Z"
  },
  {
    "id": 920,
    "parent_run_id": "070967f1b41d3d07",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 932,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:23Z"
  },
  {
    "id": 921,
    "parent_run_id": "070967f1b41d3d07",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1584,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:25Z"
  },
  {
    "id": 922,
    "parent_run_id": "070967f1b41d3d07",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 934,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:25Z"
  },
  {
    "id": 923,
    "parent_run_id": "ad84f606fe3068a5",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 613,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:26Z"
  },
  {
    "id": 924,
    "parent_run_id": "ad84f606fe3068a5",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1862,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-11T05:03:28Z"
  },
  {
    "id": 925,
    "parent_run_id": "ad84f606fe3068a5",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 932,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:29Z"
  },
  {
    "id": 926,
    "parent_run_id": "73a2154faadc8ebd",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 723,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-11T05:03:30Z"
  },
  {
    "id": 927,
    "parent_run_id": "64989df9c581c164",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1002,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-11T05:03:31Z"
  },
  {
    "id": 928,
    "parent_run_id": "f26f3951f19c6737",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 789,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:31Z"
  },
  {
    "id": 929,
    "parent_run_id": "d492223367c1de04",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 751,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-11T05:03:32Z"
  },
  {
    "id": 930,
    "parent_run_id": "429a625ee51a8d7f",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1409,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-11T05:03:34Z"
  },
  {
    "id": 931,
    "parent_run_id": "42664af6d5a29d00",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 628,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-11T05:03:34Z"
  },
  {
    "id": 941,
    "parent_run_id": "f1c5eaec138f5f63",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1858,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T05:03:35Z"
  },
  {
    "id": 942,
    "parent_run_id": "c10a6cff8eacf4b2",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1873,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T05:03:37Z"
  },
  {
    "id": 943,
    "parent_run_id": "bbb439c9a0f0ac7c",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1596,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:39Z"
  },
  {
    "id": 944,
    "parent_run_id": "e38650a335150868",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 724,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:40Z"
  },
  {
    "id": 945,
    "parent_run_id": "e38650a335150868",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 695,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:40Z"
  },
  {
    "id": 946,
    "parent_run_id": "e38650a335150868",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2085,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:42Z"
  },
  {
    "id": 947,
    "parent_run_id": "8d4c9bfd26faea37",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 744,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:43Z"
  },
  {
    "id": 948,
    "parent_run_id": "8d4c9bfd26faea37",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1384,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:44Z"
  },
  {
    "id": 949,
    "parent_run_id": "8d4c9bfd26faea37",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1723,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:46Z"
  },
  {
    "id": 950,
    "parent_run_id": "b2186731c4a3a62a",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 954,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:47Z"
  },
  {
    "id": 951,
    "parent_run_id": "b2186731c4a3a62a",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1660,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T05:03:49Z"
  },
  {
    "id": 952,
    "parent_run_id": "b2186731c4a3a62a",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1217,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:50Z"
  },
  {
    "id": 953,
    "parent_run_id": "da75badc48c004e9",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 721,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:51Z"
  },
  {
    "id": 954,
    "parent_run_id": "da75badc48c004e9",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 884,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:52Z"
  },
  {
    "id": 955,
    "parent_run_id": "da75badc48c004e9",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 2386,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:54Z"
  },
  {
    "id": 956,
    "parent_run_id": "1fd06dd96d306f72",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 854,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:55Z"
  },
  {
    "id": 957,
    "parent_run_id": "1fd06dd96d306f72",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 716,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:56Z"
  },
  {
    "id": 958,
    "parent_run_id": "1fd06dd96d306f72",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 555,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:56Z"
  },
  {
    "id": 959,
    "parent_run_id": "dd5d88077f31a9f9",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 841,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:57Z"
  },
  {
    "id": 960,
    "parent_run_id": "dd5d88077f31a9f9",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 579,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T05:03:58Z"
  },
  {
    "id": 961,
    "parent_run_id": "dd5d88077f31a9f9",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 580,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:58Z"
  },
  {
    "id": 962,
    "parent_run_id": "c683449898a36f3d",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 828,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-12T05:03:59Z"
  },
  {
    "id": 963,
    "parent_run_id": "c683449898a36f3d",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 900,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:00Z"
  },
  {
    "id": 964,
    "parent_run_id": "c683449898a36f3d",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 807,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:01Z"
  },
  {
    "id": 965,
    "parent_run_id": "800c0a18b6fce9c1",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1020,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:02Z"
  },
  {
    "id": 966,
    "parent_run_id": "800c0a18b6fce9c1",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1122,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:03Z"
  },
  {
    "id": 967,
    "parent_run_id": "800c0a18b6fce9c1",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 494,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:03Z"
  },
  {
    "id": 968,
    "parent_run_id": "c724f0956ef91ad4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 675,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:04Z"
  },
  {
    "id": 969,
    "parent_run_id": "c724f0956ef91ad4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 624,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T05:04:05Z"
  },
  {
    "id": 970,
    "parent_run_id": "c724f0956ef91ad4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 596,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:05Z"
  },
  {
    "id": 971,
    "parent_run_id": "8b162fcfb6ba89ac",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 867,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:06Z"
  },
  {
    "id": 972,
    "parent_run_id": "8b162fcfb6ba89ac",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1069,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:07Z"
  },
  {
    "id": 973,
    "parent_run_id": "8b162fcfb6ba89ac",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 623,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:08Z"
  },
  {
    "id": 974,
    "parent_run_id": "40c48ca967600c93",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 857,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:09Z"
  },
  {
    "id": 975,
    "parent_run_id": "40c48ca967600c93",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1300,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:10Z"
  },
  {
    "id": 976,
    "parent_run_id": "40c48ca967600c93",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1053,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:11Z"
  },
  {
    "id": 977,
    "parent_run_id": "a77130be7c3214c7",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 960,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:12Z"
  },
  {
    "id": 978,
    "parent_run_id": "a77130be7c3214c7",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 2612,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:15Z"
  },
  {
    "id": 979,
    "parent_run_id": "a77130be7c3214c7",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 814,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:16Z"
  },
  {
    "id": 980,
    "parent_run_id": "7ec6ce9d1ea5cf71",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 909,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:17Z"
  },
  {
    "id": 981,
    "parent_run_id": "7ec6ce9d1ea5cf71",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 605,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:17Z"
  },
  {
    "id": 982,
    "parent_run_id": "7ec6ce9d1ea5cf71",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 582,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:18Z"
  },
  {
    "id": 983,
    "parent_run_id": "9c340909114f2552",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 841,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:19Z"
  },
  {
    "id": 984,
    "parent_run_id": "9c340909114f2552",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1358,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:20Z"
  },
  {
    "id": 985,
    "parent_run_id": "9c340909114f2552",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 447,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:20Z"
  },
  {
    "id": 986,
    "parent_run_id": "1f2f6e7813cc63ff",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 979,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:21Z"
  },
  {
    "id": 987,
    "parent_run_id": "1f2f6e7813cc63ff",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 2767,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:24Z"
  },
  {
    "id": 988,
    "parent_run_id": "1f2f6e7813cc63ff",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 5570,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:30Z"
  },
  {
    "id": 989,
    "parent_run_id": "786ad912bebf4cab",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 889,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T05:04:31Z"
  },
  {
    "id": 990,
    "parent_run_id": "4b9862e7881e41f4",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1499,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T05:04:32Z"
  },
  {
    "id": 991,
    "parent_run_id": "11e6d4db0ca3dcc5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 956,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:33Z"
  },
  {
    "id": 992,
    "parent_run_id": "21b5119c0f613ee9",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1050,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T05:04:34Z"
  },
  {
    "id": 993,
    "parent_run_id": "ea0d2b7b34f5a530",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 788,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T05:04:35Z"
  },
  {
    "id": 994,
    "parent_run_id": "3468bf08b8960ea2",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 873,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T05:04:36Z"
  },
  {
    "id": 995,
    "parent_run_id": "608bc5b69b3912f5",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1552,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T13:35:41Z"
  },
  {
    "id": 996,
    "parent_run_id": "8f77ce236c4a5b2d",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 939,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T13:35:42Z"
  },
  {
    "id": 997,
    "parent_run_id": "02c19df7c1d3523b",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 724,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:42Z"
  },
  {
    "id": 998,
    "parent_run_id": "29aa85cacd828fd9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 865,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:43Z"
  },
  {
    "id": 999,
    "parent_run_id": "29aa85cacd828fd9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1232,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:44Z"
  },
  {
    "id": 1000,
    "parent_run_id": "29aa85cacd828fd9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 2150,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:47Z"
  },
  {
    "id": 1001,
    "parent_run_id": "9efd9824d03f7a9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 790,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:47Z"
  },
  {
    "id": 1002,
    "parent_run_id": "9efd9824d03f7a9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1483,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:49Z"
  },
  {
    "id": 1003,
    "parent_run_id": "9efd9824d03f7a9e",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1048,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:50Z"
  },
  {
    "id": 1004,
    "parent_run_id": "bc6a70a2df7511aa",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1288,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:51Z"
  },
  {
    "id": 1005,
    "parent_run_id": "bc6a70a2df7511aa",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2131,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T13:35:53Z"
  },
  {
    "id": 1006,
    "parent_run_id": "bc6a70a2df7511aa",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2375,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:56Z"
  },
  {
    "id": 1007,
    "parent_run_id": "3ca117c544ae3cdc",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1043,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:57Z"
  },
  {
    "id": 1008,
    "parent_run_id": "3ca117c544ae3cdc",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 622,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:57Z"
  },
  {
    "id": 1009,
    "parent_run_id": "3ca117c544ae3cdc",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1032,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:58Z"
  },
  {
    "id": 1010,
    "parent_run_id": "b6593e371bbe612b",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 804,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-12T13:35:59Z"
  },
  {
    "id": 1011,
    "parent_run_id": "b6593e371bbe612b",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 714,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:00Z"
  },
  {
    "id": 1012,
    "parent_run_id": "b6593e371bbe612b",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 644,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:01Z"
  },
  {
    "id": 1013,
    "parent_run_id": "bdda6da6bc5a12f4",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 838,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:01Z"
  },
  {
    "id": 1014,
    "parent_run_id": "bdda6da6bc5a12f4",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 713,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T13:36:02Z"
  },
  {
    "id": 1015,
    "parent_run_id": "bdda6da6bc5a12f4",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 1072,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:03Z"
  },
  {
    "id": 1016,
    "parent_run_id": "d81b65a1ed20dd9c",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 882,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:04Z"
  },
  {
    "id": 1017,
    "parent_run_id": "d81b65a1ed20dd9c",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 540,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:05Z"
  },
  {
    "id": 1018,
    "parent_run_id": "d81b65a1ed20dd9c",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 883,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:06Z"
  },
  {
    "id": 1019,
    "parent_run_id": "d709bd8ec8b2c4bd",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 913,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:06Z"
  },
  {
    "id": 1020,
    "parent_run_id": "d709bd8ec8b2c4bd",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 752,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:07Z"
  },
  {
    "id": 1021,
    "parent_run_id": "d709bd8ec8b2c4bd",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 598,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:08Z"
  },
  {
    "id": 1022,
    "parent_run_id": "852317b59cc48997",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 682,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:08Z"
  },
  {
    "id": 1023,
    "parent_run_id": "852317b59cc48997",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 740,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T13:36:09Z"
  },
  {
    "id": 1024,
    "parent_run_id": "852317b59cc48997",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 784,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:10Z"
  },
  {
    "id": 1025,
    "parent_run_id": "4031fceafb575913",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 813,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:11Z"
  },
  {
    "id": 1026,
    "parent_run_id": "4031fceafb575913",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1422,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:12Z"
  },
  {
    "id": 1027,
    "parent_run_id": "4031fceafb575913",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 610,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:13Z"
  },
  {
    "id": 1028,
    "parent_run_id": "e45edaef19de21d9",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 2059,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:15Z"
  },
  {
    "id": 1029,
    "parent_run_id": "e45edaef19de21d9",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1272,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:16Z"
  },
  {
    "id": 1030,
    "parent_run_id": "e45edaef19de21d9",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 459,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:17Z"
  },
  {
    "id": 1031,
    "parent_run_id": "74b8014aedb1546b",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1341,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:18Z"
  },
  {
    "id": 1032,
    "parent_run_id": "74b8014aedb1546b",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2111,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T13:36:20Z"
  },
  {
    "id": 1033,
    "parent_run_id": "74b8014aedb1546b",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1183,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:21Z"
  },
  {
    "id": 1034,
    "parent_run_id": "69631b5ca0482dfd",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 847,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:22Z"
  },
  {
    "id": 1035,
    "parent_run_id": "69631b5ca0482dfd",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1678,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:24Z"
  },
  {
    "id": 1036,
    "parent_run_id": "69631b5ca0482dfd",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 988,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:25Z"
  },
  {
    "id": 1037,
    "parent_run_id": "dbc00df5af63ae9c",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 992,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:26Z"
  },
  {
    "id": 1038,
    "parent_run_id": "dbc00df5af63ae9c",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1552,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:27Z"
  },
  {
    "id": 1039,
    "parent_run_id": "dbc00df5af63ae9c",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 647,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:28Z"
  },
  {
    "id": 1040,
    "parent_run_id": "3f0c4795e2af116d",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 868,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:29Z"
  },
  {
    "id": 1041,
    "parent_run_id": "3f0c4795e2af116d",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1703,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-12T13:36:31Z"
  },
  {
    "id": 1042,
    "parent_run_id": "3f0c4795e2af116d",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 843,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:32Z"
  },
  {
    "id": 1043,
    "parent_run_id": "e75615bc9d618ce1",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1067,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T13:36:33Z"
  },
  {
    "id": 1044,
    "parent_run_id": "725339ddd0d0b13e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1059,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T13:36:34Z"
  },
  {
    "id": 1045,
    "parent_run_id": "dbcf26cee3f8816e",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 680,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:34Z"
  },
  {
    "id": 1046,
    "parent_run_id": "c346752cf959c2b3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1033,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-12T13:36:35Z"
  },
  {
    "id": 1047,
    "parent_run_id": "6ca8dbe3c9e43c54",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 907,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-12T13:36:36Z"
  },
  {
    "id": 1048,
    "parent_run_id": "df3750fa69b23e61",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1961,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-12T13:36:38Z"
  },
  {
    "id": 1051,
    "parent_run_id": "b312fcd301e93528",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 1369,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-13T05:03:36Z"
  },
  {
    "id": 1052,
    "parent_run_id": "dc05ed43237325cf",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 1219,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-13T05:03:37Z"
  },
  {
    "id": 1053,
    "parent_run_id": "00c796b9f393cbcd",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 611,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:38Z"
  },
  {
    "id": 1054,
    "parent_run_id": "7549084aa7a1c856",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 810,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:38Z"
  },
  {
    "id": 1055,
    "parent_run_id": "7549084aa7a1c856",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 677,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:39Z"
  },
  {
    "id": 1056,
    "parent_run_id": "7549084aa7a1c856",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1745,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:41Z"
  },
  {
    "id": 1057,
    "parent_run_id": "f26aa6829aff6bb1",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 679,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:41Z"
  },
  {
    "id": 1058,
    "parent_run_id": "f26aa6829aff6bb1",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 783,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:42Z"
  },
  {
    "id": 1059,
    "parent_run_id": "f26aa6829aff6bb1",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 2555,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:45Z"
  },
  {
    "id": 1060,
    "parent_run_id": "fd1f97c9ab033e1a",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1806,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:47Z"
  },
  {
    "id": 1061,
    "parent_run_id": "fd1f97c9ab033e1a",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 3168,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:50Z"
  },
  {
    "id": 1062,
    "parent_run_id": "fd1f97c9ab033e1a",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 1215,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:51Z"
  },
  {
    "id": 1063,
    "parent_run_id": "25bd972743c7affc",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 1001,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:52Z"
  },
  {
    "id": 1064,
    "parent_run_id": "25bd972743c7affc",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 650,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:53Z"
  },
  {
    "id": 1065,
    "parent_run_id": "25bd972743c7affc",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 916,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:54Z"
  },
  {
    "id": 1066,
    "parent_run_id": "a5fe9fd0cb14c248",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 1141,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:55Z"
  },
  {
    "id": 1067,
    "parent_run_id": "a5fe9fd0cb14c248",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 595,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:55Z"
  },
  {
    "id": 1068,
    "parent_run_id": "a5fe9fd0cb14c248",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 603,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:56Z"
  },
  {
    "id": 1069,
    "parent_run_id": "eef055f8c0385523",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 792,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:57Z"
  },
  {
    "id": 1070,
    "parent_run_id": "eef055f8c0385523",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 779,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-13T05:03:58Z"
  },
  {
    "id": 1071,
    "parent_run_id": "eef055f8c0385523",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 658,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:58Z"
  },
  {
    "id": 1072,
    "parent_run_id": "dbc640de0367d75c",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 888,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 3.75e-06,
    "error": null,
    "created_at": "2026-05-13T05:03:59Z"
  },
  {
    "id": 1073,
    "parent_run_id": "dbc640de0367d75c",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 616,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 1.0500000000000001e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:00Z"
  },
  {
    "id": 1074,
    "parent_run_id": "dbc640de0367d75c",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hello world how are you doing today friend... [sha256:ccb2e90bed48]",
    "output_text": "en",
    "expected": "en",
    "correct": 1,
    "latency_ms": 920,
    "input_tokens": 10,
    "output_tokens": 1,
    "cost_eur": 2.1000000000000002e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:01Z"
  },
  {
    "id": 1075,
    "parent_run_id": "72d93e466fb43b14",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 717,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 4e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:01Z"
  },
  {
    "id": 1076,
    "parent_run_id": "72d93e466fb43b14",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 995,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 1.125e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:02Z"
  },
  {
    "id": 1077,
    "parent_run_id": "72d93e466fb43b14",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Bonjour comment allez-vous aujourd'hui mon ami... [sha256:98ecb16237cb]",
    "output_text": "fr",
    "expected": "fr",
    "correct": 1,
    "latency_ms": 799,
    "input_tokens": 11,
    "output_tokens": 1,
    "cost_eur": 2.25e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:03Z"
  },
  {
    "id": 1078,
    "parent_run_id": "7961d8c5b60e562c",
    "task_class": "detect_language",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 834,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:04Z"
  },
  {
    "id": 1079,
    "parent_run_id": "7961d8c5b60e562c",
    "task_class": "detect_language",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 604,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-13T05:04:05Z"
  },
  {
    "id": 1080,
    "parent_run_id": "7961d8c5b60e562c",
    "task_class": "detect_language",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "Hallo wie geht es dir heute mein Freund... [sha256:bbe7abb8a492]",
    "output_text": "de",
    "expected": "de",
    "correct": 1,
    "latency_ms": 365,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:05Z"
  },
  {
    "id": 1081,
    "parent_run_id": "3e82a6be19faec60",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 699,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:06Z"
  },
  {
    "id": 1082,
    "parent_run_id": "3e82a6be19faec60",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 703,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:06Z"
  },
  {
    "id": 1083,
    "parent_run_id": "3e82a6be19faec60",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 641,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:07Z"
  },
  {
    "id": 1084,
    "parent_run_id": "f434bb6444421cd7",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 593,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:08Z"
  },
  {
    "id": 1085,
    "parent_run_id": "f434bb6444421cd7",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1081,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:09Z"
  },
  {
    "id": 1086,
    "parent_run_id": "f434bb6444421cd7",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 467,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:09Z"
  },
  {
    "id": 1087,
    "parent_run_id": "3e5a159a15cb9481",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 595,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:10Z"
  },
  {
    "id": 1088,
    "parent_run_id": "3e5a159a15cb9481",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2330,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 9.749999999999998e-07,
    "error": null,
    "created_at": "2026-05-13T05:04:12Z"
  },
  {
    "id": 1089,
    "parent_run_id": "3e5a159a15cb9481",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 3390,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:16Z"
  },
  {
    "id": 1090,
    "parent_run_id": "0dcaf16cc43ff8fc",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 658,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:16Z"
  },
  {
    "id": 1091,
    "parent_run_id": "0dcaf16cc43ff8fc",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 1278,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:17Z"
  },
  {
    "id": 1092,
    "parent_run_id": "0dcaf16cc43ff8fc",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "I absolutely love this product it works perfectly... [sha256:6e49d8ee8854]",
    "output_text": "Positive",
    "expected": "positive",
    "correct": 1,
    "latency_ms": 704,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:18Z"
  },
  {
    "id": 1093,
    "parent_run_id": "9628d7920f88d377",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 761,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:19Z"
  },
  {
    "id": 1094,
    "parent_run_id": "9628d7920f88d377",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 1298,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 1.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:20Z"
  },
  {
    "id": 1095,
    "parent_run_id": "9628d7920f88d377",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "This was a terrible experience I want my money back... [sha256:d0e80c5d2076]",
    "output_text": "Negative",
    "expected": "negative",
    "correct": 1,
    "latency_ms": 523,
    "input_tokens": 12,
    "output_tokens": 2,
    "cost_eur": 3e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:21Z"
  },
  {
    "id": 1096,
    "parent_run_id": "7b94478bff0bbeaa",
    "task_class": "classify_sentiment",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 668,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 3.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:21Z"
  },
  {
    "id": 1097,
    "parent_run_id": "7b94478bff0bbeaa",
    "task_class": "classify_sentiment",
    "subtask_idx": 1,
    "provider": "gemini",
    "model_name": "gemini",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "Positive",
    "expected": "neutral",
    "correct": 0,
    "latency_ms": 3125,
    "input_tokens": 9,
    "output_tokens": 2,
    "cost_eur": 1.2749999999999999e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:25Z"
  },
  {
    "id": 1098,
    "parent_run_id": "7b94478bff0bbeaa",
    "task_class": "classify_sentiment",
    "subtask_idx": 2,
    "provider": "openai",
    "model_name": "openai",
    "input_text": "The package arrived on Tuesday morning... [sha256:ab25ceb1f147]",
    "output_text": "neutral",
    "expected": "neutral",
    "correct": 1,
    "latency_ms": 2682,
    "input_tokens": 9,
    "output_tokens": 1,
    "cost_eur": 1.9499999999999995e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:27Z"
  },
  {
    "id": 1099,
    "parent_run_id": "53b02ef085cccc69",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 739,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-13T05:04:28Z"
  },
  {
    "id": 1100,
    "parent_run_id": "e613827564a117b4",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 812,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-13T05:04:29Z"
  },
  {
    "id": 1101,
    "parent_run_id": "cdc2683114e00aeb",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 603,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:29Z"
  },
  {
    "id": 1102,
    "parent_run_id": "30f56f4a848f636c",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Reach out to alice@example.com or bob.smith@test.org for hel... [sha256:c2c3fcfc308f]",
    "output_text": "```json\n[\"alice@example.com\", \"bob.smith@test.org\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"alice@example.com\", \"bob.smith@test.org\"]",
    "correct": 1,
    "latency_ms": 722,
    "input_tokens": 15,
    "output_tokens": 13,
    "cost_eur": 2e-05,
    "error": null,
    "created_at": "2026-05-13T05:04:30Z"
  },
  {
    "id": 1103,
    "parent_run_id": "eed132185f667bd6",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "Email me at hello@astranl.com please.... [sha256:5bd48f83cce8]",
    "output_text": "```json\n[\"hello@astranl.com\"]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[\"hello@astranl.com\"]",
    "correct": 1,
    "latency_ms": 849,
    "input_tokens": 9,
    "output_tokens": 8,
    "cost_eur": 1.225e-05,
    "error": null,
    "created_at": "2026-05-13T05:04:31Z"
  },
  {
    "id": 1104,
    "parent_run_id": "b6306081392154e3",
    "task_class": "extract_emails",
    "subtask_idx": 0,
    "provider": "anthropic",
    "model_name": "anthropic",
    "input_text": "No emails in this text at all.... [sha256:126563e18796]",
    "output_text": "```json\n[]\n```\n[reeval_2026_05_15: markdown-stripped match]",
    "expected": "[]",
    "correct": 1,
    "latency_ms": 1031,
    "input_tokens": 7,
    "output_tokens": 3,
    "cost_eur": 5.5e-06,
    "error": null,
    "created_at": "2026-05-13T05:04:32Z"
  }
]