796 lines
20 KiB
JSON
796 lines
20 KiB
JSON
{
|
|
"results": [
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:09.502Z",
|
|
"passed": true,
|
|
"duration": 1237
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:13.802Z",
|
|
"passed": true,
|
|
"duration": 4298
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:15.214Z",
|
|
"passed": true,
|
|
"duration": 1411
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:18.337Z",
|
|
"passed": true,
|
|
"duration": 3122
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:18.922Z",
|
|
"passed": true,
|
|
"duration": 583
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T10:56:22.539Z",
|
|
"passed": true,
|
|
"duration": 3615
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:08.904Z",
|
|
"passed": true,
|
|
"duration": 1888
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:15.210Z",
|
|
"passed": true,
|
|
"duration": 6304
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:16.502Z",
|
|
"passed": true,
|
|
"duration": 1291
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:18.728Z",
|
|
"passed": true,
|
|
"duration": 2225
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:19.938Z",
|
|
"passed": true,
|
|
"duration": 1209
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:01:27.791Z",
|
|
"passed": true,
|
|
"duration": 7852
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:21.370Z",
|
|
"passed": true,
|
|
"duration": 1213,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:24.898Z",
|
|
"passed": true,
|
|
"duration": 3524,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:25.624Z",
|
|
"passed": true,
|
|
"duration": 724,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:26.630Z",
|
|
"passed": true,
|
|
"duration": 1005,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:27.812Z",
|
|
"passed": true,
|
|
"duration": 1178,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:31.317Z",
|
|
"passed": true,
|
|
"duration": 3503,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:32.288Z",
|
|
"passed": true,
|
|
"duration": 969,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:33.147Z",
|
|
"passed": true,
|
|
"duration": 858,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:33.724Z",
|
|
"passed": true,
|
|
"duration": 576,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:34.841Z",
|
|
"passed": true,
|
|
"duration": 1115,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:35.673Z",
|
|
"passed": true,
|
|
"duration": 831,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:16:36.762Z",
|
|
"passed": true,
|
|
"duration": 1087,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:25.749Z",
|
|
"passed": true,
|
|
"duration": 1644,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:31.261Z",
|
|
"passed": true,
|
|
"duration": 5507,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:32.131Z",
|
|
"passed": true,
|
|
"duration": 869,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:33.306Z",
|
|
"passed": true,
|
|
"duration": 1173,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:34.323Z",
|
|
"passed": true,
|
|
"duration": 1016,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:38.976Z",
|
|
"passed": true,
|
|
"duration": 4651,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:39.914Z",
|
|
"passed": true,
|
|
"duration": 937,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:41.053Z",
|
|
"passed": true,
|
|
"duration": 1137,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:42.918Z",
|
|
"passed": true,
|
|
"duration": 1863,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:47.234Z",
|
|
"passed": true,
|
|
"duration": 4314,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:47.966Z",
|
|
"passed": true,
|
|
"duration": 730,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:20:48.941Z",
|
|
"passed": true,
|
|
"duration": 973,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:15.745Z",
|
|
"passed": true,
|
|
"duration": 1951,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:19.476Z",
|
|
"passed": true,
|
|
"duration": 3726,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:20.854Z",
|
|
"passed": true,
|
|
"duration": 1376,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:28.044Z",
|
|
"passed": true,
|
|
"duration": 7188,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "deepseek/deepseek-r1",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:43.203Z",
|
|
"passed": true,
|
|
"duration": 15157,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "addition",
|
|
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"8"
|
|
],
|
|
"expected": "8",
|
|
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:50.736Z",
|
|
"passed": true,
|
|
"duration": 7531,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:51.834Z",
|
|
"passed": true,
|
|
"duration": 1096,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:55.428Z",
|
|
"passed": true,
|
|
"duration": 3592,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:56.874Z",
|
|
"passed": true,
|
|
"duration": 1444,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:25:57.746Z",
|
|
"passed": true,
|
|
"duration": 870,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "deepseek/deepseek-r1",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:08.731Z",
|
|
"passed": true,
|
|
"duration": 10983,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"24"
|
|
],
|
|
"expected": "24",
|
|
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:14.379Z",
|
|
"passed": true,
|
|
"duration": 5646,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:15.658Z",
|
|
"passed": true,
|
|
"duration": 1276,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "qwen/qwq-32b",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:21.428Z",
|
|
"passed": true,
|
|
"duration": 5768,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-4o-mini",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:22.358Z",
|
|
"passed": true,
|
|
"duration": 929,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:23.155Z",
|
|
"passed": true,
|
|
"duration": 794,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "deepseek/deepseek-r1",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:38.566Z",
|
|
"passed": true,
|
|
"duration": 15409,
|
|
"category": "basic"
|
|
},
|
|
{
|
|
"test": "division",
|
|
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
|
"result": [
|
|
"5"
|
|
],
|
|
"expected": "5",
|
|
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-02T11:26:40.358Z",
|
|
"passed": true,
|
|
"duration": 1790,
|
|
"category": "basic"
|
|
}
|
|
],
|
|
"highscores": [
|
|
{
|
|
"test": "addition",
|
|
"rankings": [
|
|
{
|
|
"model": "openai/gpt-4o-mini",
|
|
"duration": 1376,
|
|
"duration_secs": 1.376
|
|
},
|
|
{
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"duration": 1951,
|
|
"duration_secs": 1.951
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"test": "multiplication",
|
|
"rankings": [
|
|
{
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"duration": 870,
|
|
"duration_secs": 0.87
|
|
},
|
|
{
|
|
"model": "anthropic/claude-3.5-sonnet",
|
|
"duration": 1096,
|
|
"duration_secs": 1.096
|
|
}
|
|
]
|
|
},
|
|
{
|
|
"test": "division",
|
|
"rankings": [
|
|
{
|
|
"model": "openai/gpt-3.5-turbo",
|
|
"duration": 794,
|
|
"duration_secs": 0.794
|
|
},
|
|
{
|
|
"model": "openai/gpt-4o-mini",
|
|
"duration": 929,
|
|
"duration_secs": 0.929
|
|
}
|
|
]
|
|
}
|
|
],
|
|
"lastUpdated": "2025-04-02T11:26:40.358Z"
|
|
} |