mirror of
https://github.com/wassname/Judgemark-v2lp.git
synced 2026-06-27 16:10:14 +08:00
12249 lines
321 KiB
JSON
12249 lines
321 KiB
JSON
{
|
|
"judge_model": "deepseek/deepseek-r1-distill-qwen-14b",
|
|
"start_time": "2025-01-30T21:28:21.658753",
|
|
"status": "running",
|
|
"samples_file": "data/judgemark_v2.1_samples.json",
|
|
"prompts_file": "data/judge_prompts.json",
|
|
"errors": [
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-5-sonnet-20240620",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10521f30>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106a2950>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106005e0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10602710>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106ecaf0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106ee320>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106eda50>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106a0ee0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106ec8b0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb28486ec0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb28485ab0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10640be0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10641930>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10643f10>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb10641450>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb105785e0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb2844ee00>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb2ad90130>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb283f27a0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb283c0f70>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb106ca050>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb28486050>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "HTTPSConnectionPool(host='openrouter.ai', port=443): Max retries exceeded with url: /api/v1/chat/completions (Caused by NameResolutionError(\"<urllib3.connection.HTTPSConnection object at 0x7fcb105222f0>: Failed to resolve 'openrouter.ai' ([Errno -3] Temporary failure in name resolution)\"))"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-haiku-20240307",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "claude-3-opus-20240229",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-001",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-3-70b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x7B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Llama-2-13b-chat-hf",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-7b-it",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemma-2b-it",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mixtral-8x22B-Instruct-v0.1",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "c4ai-command-r-08-2024",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gemini-1.5-pro-002",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "Mistral-Large-Instruct-2411",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-4o-2024-11-20",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "DeepSeek-R1",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "gpt-3.5-turbo-0125",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "1",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "2",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "3",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "4",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "2",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "6",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "9",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "10",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "19",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "20",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "22",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "26",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "27",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "28",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "29",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "30",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "31",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "32",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "33",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "34",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "35",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "36",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "37",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "38",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "41",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "42",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "43",
|
|
"error": "'choices'"
|
|
},
|
|
{
|
|
"model": "databricks/dbrx-instruct",
|
|
"iteration": "5",
|
|
"item_id": "44",
|
|
"error": "'choices'"
|
|
}
|
|
]
|
|
} |