8670 lines
381 KiB
JSON
8670 lines
381 KiB
JSON
{
|
||
"results": [
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:13:10.276Z",
|
||
"passed": false,
|
||
"duration": 1242,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:13:31.650Z",
|
||
"passed": false,
|
||
"duration": 21368,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:13:34.699Z",
|
||
"passed": true,
|
||
"duration": 3046,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:13:45.957Z",
|
||
"passed": true,
|
||
"duration": 11256,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:13:47.935Z",
|
||
"passed": true,
|
||
"duration": 1976,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:14:07.714Z",
|
||
"passed": false,
|
||
"duration": 19778,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:14:08.883Z",
|
||
"passed": true,
|
||
"duration": 1167,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:14:12.225Z",
|
||
"passed": true,
|
||
"duration": 3341,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:14:12.889Z",
|
||
"passed": true,
|
||
"duration": 663,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:14:32.527Z",
|
||
"passed": true,
|
||
"duration": 19636,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:21.370Z",
|
||
"passed": true,
|
||
"duration": 1213,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:24.898Z",
|
||
"passed": true,
|
||
"duration": 3524,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:25.624Z",
|
||
"passed": true,
|
||
"duration": 724,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:26.630Z",
|
||
"passed": true,
|
||
"duration": 1005,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:27.812Z",
|
||
"passed": true,
|
||
"duration": 1178,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:31.317Z",
|
||
"passed": true,
|
||
"duration": 3503,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:32.288Z",
|
||
"passed": true,
|
||
"duration": 969,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:33.147Z",
|
||
"passed": true,
|
||
"duration": 858,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:33.724Z",
|
||
"passed": true,
|
||
"duration": 576,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:34.841Z",
|
||
"passed": true,
|
||
"duration": 1115,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:35.673Z",
|
||
"passed": true,
|
||
"duration": 831,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:16:36.762Z",
|
||
"passed": true,
|
||
"duration": 1087,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:25.749Z",
|
||
"passed": true,
|
||
"duration": 1644,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:31.261Z",
|
||
"passed": true,
|
||
"duration": 5507,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:32.131Z",
|
||
"passed": true,
|
||
"duration": 869,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:33.306Z",
|
||
"passed": true,
|
||
"duration": 1173,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:34.323Z",
|
||
"passed": true,
|
||
"duration": 1016,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:38.976Z",
|
||
"passed": true,
|
||
"duration": 4651,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:39.914Z",
|
||
"passed": true,
|
||
"duration": 937,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:41.053Z",
|
||
"passed": true,
|
||
"duration": 1137,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:42.918Z",
|
||
"passed": true,
|
||
"duration": 1863,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:47.234Z",
|
||
"passed": true,
|
||
"duration": 4314,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:47.966Z",
|
||
"passed": true,
|
||
"duration": 730,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:20:48.941Z",
|
||
"passed": true,
|
||
"duration": 973,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:10.419Z",
|
||
"passed": false,
|
||
"duration": 1650,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3,-2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:20.647Z",
|
||
"passed": true,
|
||
"duration": 10222,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:21.643Z",
|
||
"passed": false,
|
||
"duration": 994,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:22.524Z",
|
||
"passed": false,
|
||
"duration": 878,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:23.496Z",
|
||
"passed": true,
|
||
"duration": 970,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:28.452Z",
|
||
"passed": true,
|
||
"duration": 4954,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:29.325Z",
|
||
"passed": true,
|
||
"duration": 872,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:30.109Z",
|
||
"passed": true,
|
||
"duration": 782,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:33.902Z",
|
||
"passed": true,
|
||
"duration": 3791,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:46.225Z",
|
||
"passed": false,
|
||
"duration": 12322,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:47.202Z",
|
||
"passed": false,
|
||
"duration": 974,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:48.005Z",
|
||
"passed": true,
|
||
"duration": 800,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:48.763Z",
|
||
"passed": true,
|
||
"duration": 756,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:55.510Z",
|
||
"passed": true,
|
||
"duration": 6745,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:56.297Z",
|
||
"passed": true,
|
||
"duration": 785,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:57.051Z",
|
||
"passed": true,
|
||
"duration": 751,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:22:58.294Z",
|
||
"passed": true,
|
||
"duration": 1241,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:23:04.551Z",
|
||
"passed": false,
|
||
"duration": 6255,
|
||
"reason": "Model returned empty response",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:23:05.297Z",
|
||
"passed": true,
|
||
"duration": 743,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:23:06.018Z",
|
||
"passed": true,
|
||
"duration": 719,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:24:32.237Z",
|
||
"passed": false,
|
||
"duration": 1533,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3, -2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:24:50.178Z",
|
||
"passed": false,
|
||
"duration": 17934,
|
||
"reason": "Expected -3,-2, but got -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:24:51.040Z",
|
||
"passed": false,
|
||
"duration": 859,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:24:51.938Z",
|
||
"passed": false,
|
||
"duration": 895,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:15.745Z",
|
||
"passed": true,
|
||
"duration": 1951,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:19.476Z",
|
||
"passed": true,
|
||
"duration": 3726,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:20.854Z",
|
||
"passed": true,
|
||
"duration": 1376,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:28.044Z",
|
||
"passed": true,
|
||
"duration": 7188,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:43.203Z",
|
||
"passed": true,
|
||
"duration": 15157,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:50.736Z",
|
||
"passed": true,
|
||
"duration": 7531,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:51.834Z",
|
||
"passed": true,
|
||
"duration": 1096,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:55.428Z",
|
||
"passed": true,
|
||
"duration": 3592,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:56.874Z",
|
||
"passed": true,
|
||
"duration": 1444,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:25:57.746Z",
|
||
"passed": true,
|
||
"duration": 870,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:08.731Z",
|
||
"passed": true,
|
||
"duration": 10983,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:14.379Z",
|
||
"passed": true,
|
||
"duration": 5646,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:15.658Z",
|
||
"passed": true,
|
||
"duration": 1276,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:21.428Z",
|
||
"passed": true,
|
||
"duration": 5768,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:22.358Z",
|
||
"passed": true,
|
||
"duration": 929,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:23.155Z",
|
||
"passed": true,
|
||
"duration": 794,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:38.566Z",
|
||
"passed": true,
|
||
"duration": 15409,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "openrouter",
|
||
"timestamp": "2025-04-02T11:26:40.358Z",
|
||
"passed": true,
|
||
"duration": 1790,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:22:28.224Z",
|
||
"passed": false,
|
||
"duration": 1311,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:22:58.238Z",
|
||
"passed": false,
|
||
"duration": 30008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:137:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:22:59.263Z",
|
||
"passed": false,
|
||
"duration": 1022,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3, -2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:23:00.561Z",
|
||
"passed": false,
|
||
"duration": 1294,
|
||
"reason": "Expected -3,-2, but got -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:23:17.772Z",
|
||
"passed": false,
|
||
"duration": 17208,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:23:28.819Z",
|
||
"passed": false,
|
||
"duration": 11043,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:23:30.914Z",
|
||
"passed": true,
|
||
"duration": 2093,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:23:36.265Z",
|
||
"passed": true,
|
||
"duration": 5349,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:23:37.084Z",
|
||
"passed": true,
|
||
"duration": 816,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:23:38.020Z",
|
||
"passed": true,
|
||
"duration": 934,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:23:49.147Z",
|
||
"passed": true,
|
||
"duration": 11125,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:23:52.904Z",
|
||
"passed": true,
|
||
"duration": 3755,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:23:54.223Z",
|
||
"passed": true,
|
||
"duration": 1316,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:24:24.234Z",
|
||
"passed": false,
|
||
"duration": 30009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:137:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:24:25.494Z",
|
||
"passed": false,
|
||
"duration": 1257,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:24:26.272Z",
|
||
"passed": true,
|
||
"duration": 776,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:24:56.284Z",
|
||
"passed": false,
|
||
"duration": 30009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:137:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"The 6th number in the Fibonacci sequence is 5."
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:25:06.273Z",
|
||
"passed": false,
|
||
"duration": 9986,
|
||
"reason": "Expected 8, but got the 6th number in the fibonacci sequence is 5.",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:25:07.072Z",
|
||
"passed": true,
|
||
"duration": 795,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:25:12.207Z",
|
||
"passed": true,
|
||
"duration": 5133,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:25:13.308Z",
|
||
"passed": true,
|
||
"duration": 1099,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:25:14.724Z",
|
||
"passed": true,
|
||
"duration": 1414,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:25:24.633Z",
|
||
"passed": true,
|
||
"duration": 9907,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:25:28.285Z",
|
||
"passed": true,
|
||
"duration": 3650,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:25:31.067Z",
|
||
"passed": true,
|
||
"duration": 2779,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:25:35.904Z",
|
||
"passed": true,
|
||
"duration": 4834,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:25:36.993Z",
|
||
"passed": true,
|
||
"duration": 1087,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:25:37.796Z",
|
||
"passed": true,
|
||
"duration": 800,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:25:48.323Z",
|
||
"passed": true,
|
||
"duration": 10524,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"The result of 2 raised to the power of 3 is 8.\n\nAnswer: 8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:26:02.730Z",
|
||
"passed": false,
|
||
"duration": 14405,
|
||
"reason": "Expected 8, but got the result of 2 raised to the power of 3 is 8.\n\nanswer: 8",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:30:35.457Z",
|
||
"passed": false,
|
||
"duration": 3064,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3,-2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:30:47.981Z",
|
||
"passed": true,
|
||
"duration": 12517,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:30:49.084Z",
|
||
"passed": false,
|
||
"duration": 1100,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:30:50.009Z",
|
||
"passed": false,
|
||
"duration": 921,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:31:24.046Z",
|
||
"passed": false,
|
||
"duration": 2341,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:32:31.578Z",
|
||
"passed": false,
|
||
"duration": 3137,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:32:51.448Z",
|
||
"passed": false,
|
||
"duration": 1892,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3,-2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:32:58.250Z",
|
||
"passed": true,
|
||
"duration": 6795,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:32:59.105Z",
|
||
"passed": false,
|
||
"duration": 853,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:32:59.942Z",
|
||
"passed": false,
|
||
"duration": 832,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:33:19.796Z",
|
||
"passed": false,
|
||
"duration": 19850,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"The solutions to the quadratic equation x² + 5x + 6 = 0 are x = -2 and x = -3.\n\n-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:33:35.611Z",
|
||
"passed": false,
|
||
"duration": 15811,
|
||
"reason": "Expected -3,-2, but got the solutions to the quadratic equation x² + 5x + 6 = 0 are x = -2 and x = -3.\n\n-2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:33:37.469Z",
|
||
"passed": true,
|
||
"duration": 1853,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:33:44.364Z",
|
||
"passed": true,
|
||
"duration": 6892,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:33:45.323Z",
|
||
"passed": true,
|
||
"duration": 956,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:33:46.153Z",
|
||
"passed": true,
|
||
"duration": 827,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:33:57.349Z",
|
||
"passed": true,
|
||
"duration": 11193,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:34:02.166Z",
|
||
"passed": true,
|
||
"duration": 4814,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:34:04.174Z",
|
||
"passed": true,
|
||
"duration": 2004,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:34:05.686Z",
|
||
"passed": false,
|
||
"duration": 1509,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:34:07.363Z",
|
||
"passed": true,
|
||
"duration": 1673,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:34:08.909Z",
|
||
"passed": true,
|
||
"duration": 1543,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:34:38.921Z",
|
||
"passed": false,
|
||
"duration": 30009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:137:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:34:44.095Z",
|
||
"passed": false,
|
||
"duration": 5171,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:34:46.111Z",
|
||
"passed": true,
|
||
"duration": 2012,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:34:52.001Z",
|
||
"passed": true,
|
||
"duration": 5888,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:34:52.968Z",
|
||
"passed": true,
|
||
"duration": 964,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:34:54.051Z",
|
||
"passed": true,
|
||
"duration": 1080,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:35:04.364Z",
|
||
"passed": true,
|
||
"duration": 10309,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:35:10.480Z",
|
||
"passed": true,
|
||
"duration": 6114,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:35:11.619Z",
|
||
"passed": true,
|
||
"duration": 1136,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:35:19.194Z",
|
||
"passed": true,
|
||
"duration": 7572,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:35:20.455Z",
|
||
"passed": true,
|
||
"duration": 1259,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:35:21.956Z",
|
||
"passed": true,
|
||
"duration": 1498,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:35:27.372Z",
|
||
"passed": true,
|
||
"duration": 5414,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:35:37.266Z",
|
||
"passed": true,
|
||
"duration": 9891,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:36:22.644Z",
|
||
"passed": false,
|
||
"duration": 1358,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:36:31.987Z",
|
||
"passed": false,
|
||
"duration": 1375,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:37:00.757Z",
|
||
"passed": false,
|
||
"duration": 1589,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:37:38.502Z",
|
||
"passed": false,
|
||
"duration": 2344,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:37:51.538Z",
|
||
"passed": false,
|
||
"duration": 2010,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:37:59.511Z",
|
||
"passed": false,
|
||
"duration": 1399,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:39:33.082Z",
|
||
"passed": false,
|
||
"duration": 1792,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:40:21.065Z",
|
||
"passed": false,
|
||
"duration": 1221,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:40:47.110Z",
|
||
"passed": false,
|
||
"duration": 2367,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3, -2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:40:56.377Z",
|
||
"passed": false,
|
||
"duration": 9259,
|
||
"reason": "Expected -3,-2, but got -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:40:57.391Z",
|
||
"passed": false,
|
||
"duration": 1010,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:40:58.209Z",
|
||
"passed": false,
|
||
"duration": 815,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:41:02.148Z",
|
||
"passed": false,
|
||
"duration": 3934,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"The solutions to the equation x² + 5x + 6 = 0 are -2 and -3.\n\n-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:41:10.265Z",
|
||
"passed": false,
|
||
"duration": 8112,
|
||
"reason": "Expected -3,-2, but got the solutions to the equation x² + 5x + 6 = 0 are -2 and -3.\n\n-2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:41:11.723Z",
|
||
"passed": true,
|
||
"duration": 1454,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:41:21.969Z",
|
||
"passed": true,
|
||
"duration": 10242,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:41:22.848Z",
|
||
"passed": true,
|
||
"duration": 876,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:41:23.636Z",
|
||
"passed": true,
|
||
"duration": 785,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:41:30.847Z",
|
||
"passed": true,
|
||
"duration": 7208,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"5! is equal to 120. \n\nAnswer: 120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:41:34.615Z",
|
||
"passed": false,
|
||
"duration": 3765,
|
||
"reason": "Expected 120, but got 5! is equal to 120. \n\nanswer: 120",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:41:36.384Z",
|
||
"passed": true,
|
||
"duration": 1765,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:41:56.369Z",
|
||
"passed": false,
|
||
"duration": 19981,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:41:57.522Z",
|
||
"passed": true,
|
||
"duration": 1149,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:41:58.423Z",
|
||
"passed": true,
|
||
"duration": 898,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:42:28.442Z",
|
||
"passed": false,
|
||
"duration": 30014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:42:33.805Z",
|
||
"passed": false,
|
||
"duration": 5358,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:42:34.628Z",
|
||
"passed": true,
|
||
"duration": 819,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:42:35.522Z",
|
||
"passed": true,
|
||
"duration": 890,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:42:36.791Z",
|
||
"passed": true,
|
||
"duration": 1266,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:42:37.938Z",
|
||
"passed": true,
|
||
"duration": 1144,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:42:42.967Z",
|
||
"passed": true,
|
||
"duration": 5026,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:42:51.135Z",
|
||
"passed": true,
|
||
"duration": 8165,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:42:52.650Z",
|
||
"passed": true,
|
||
"duration": 1512,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:42:57.896Z",
|
||
"passed": true,
|
||
"duration": 5243,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:42:58.774Z",
|
||
"passed": true,
|
||
"duration": 875,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:42:59.643Z",
|
||
"passed": true,
|
||
"duration": 866,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:43:13.962Z",
|
||
"passed": false,
|
||
"duration": 1435,
|
||
"reason": "Expected -3,-2, but got -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:43:39.174Z",
|
||
"passed": false,
|
||
"duration": 25202,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:43:40.474Z",
|
||
"passed": false,
|
||
"duration": 1295,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3, -2"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:43:41.957Z",
|
||
"passed": false,
|
||
"duration": 1478,
|
||
"reason": "Expected -3,-2, but got -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:44:06.429Z",
|
||
"passed": true,
|
||
"duration": 1689,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:44:10.240Z",
|
||
"passed": true,
|
||
"duration": 3807,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:44:11.128Z",
|
||
"passed": true,
|
||
"duration": 885,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:44:21.587Z",
|
||
"passed": true,
|
||
"duration": 10455,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:44:33.654Z",
|
||
"passed": true,
|
||
"duration": 12064,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"The sum of 5 and 3 is 8. Therefore, the result is \\boxed{8}."
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:44:40.062Z",
|
||
"passed": false,
|
||
"duration": 6405,
|
||
"reason": "Expected 8, but got the sum of 5 and 3 is 8. therefore, the result is \\boxed{8}.",
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:44:41.261Z",
|
||
"passed": true,
|
||
"duration": 1190,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:44:46.272Z",
|
||
"passed": true,
|
||
"duration": 5008,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:44:47.386Z",
|
||
"passed": true,
|
||
"duration": 1111,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:44:48.372Z",
|
||
"passed": true,
|
||
"duration": 984,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24\n\n24\n\nThe result is 24.\n\n24\n\nHere's the answer: 24\n\nThe answer will be 24.\n\n24\n\n24\n\nThe product of 8 and 3 is 24.\n\n24\n\nThe answer is 24.\n\n24\n\n24\n\n24\n\nThe result is 24.\n\n24\n\nHere's the numerical result: 24\n\nThe answer is 24.\n\n24\n\n24\n\nThe answer is 24."
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:44:53.633Z",
|
||
"passed": false,
|
||
"duration": 5258,
|
||
"reason": "Expected 24, but got 24\n\n24\n\nthe result is 24.\n\n24\n\nhere's the answer: 24\n\nthe answer will be 24.\n\n24\n\n24\n\nthe product of 8 and 3 is 24.\n\n24\n\nthe answer is 24.\n\n24\n\n24\n\n24\n\nthe result is 24.\n\n24\n\nhere's the numerical result: 24\n\nthe answer is 24.\n\n24\n\n24\n\nthe answer is 24.",
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:44:55.196Z",
|
||
"passed": true,
|
||
"duration": 1558,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:44:56.604Z",
|
||
"passed": true,
|
||
"duration": 1405,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:44:57.523Z",
|
||
"passed": true,
|
||
"duration": 917,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:44:58.630Z",
|
||
"passed": true,
|
||
"duration": 1104,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:44:59.523Z",
|
||
"passed": true,
|
||
"duration": 889,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:45:06.658Z",
|
||
"passed": true,
|
||
"duration": 7130,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:45:10.307Z",
|
||
"passed": true,
|
||
"duration": 3646,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman architecture, Vatican tourism, Colosseum history, Italian cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:53:58.867Z",
|
||
"passed": false,
|
||
"duration": 1756,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican tourism, colosseum history, italian cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:54:28.879Z",
|
||
"passed": false,
|
||
"duration": 30008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome tourism, Colosseum history, Roman Forum attractions, Vatican City travel, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:54:30.304Z",
|
||
"passed": false,
|
||
"duration": 1417,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome tourism, colosseum history, roman forum attractions, vatican city travel, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history, art, culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:54:32.272Z",
|
||
"passed": false,
|
||
"duration": 1965,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history, art, culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:54:48.242Z",
|
||
"passed": false,
|
||
"duration": 15967,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome, Colosseum, Roman Forum, Vatican City, History of Rome"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:54:53.813Z",
|
||
"passed": false,
|
||
"duration": 5568,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome, colosseum, roman forum, vatican city, history of rome",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical learning, automated data analysis, predictive modeling, artificial intelligence training"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:54:55.134Z",
|
||
"passed": false,
|
||
"duration": 1318,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical learning, automated data analysis, predictive modeling, artificial intelligence training",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:55:25.143Z",
|
||
"passed": false,
|
||
"duration": 30006,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, algorithms, statistical methods, data analysis, performance improvement"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:55:26.487Z",
|
||
"passed": false,
|
||
"duration": 1341,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, algorithms, statistical methods, data analysis, performance improvement",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:55:27.413Z",
|
||
"passed": false,
|
||
"duration": 924,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods in machine learning, data-driven performance improvement, automated computer learning, self-improving algorithms"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:55:31.262Z",
|
||
"passed": false,
|
||
"duration": 3846,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods in machine learning, data-driven performance improvement, automated computer learning, self-improving algorithms",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, data learning, automated learning, self-improving systems"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:55:38.627Z",
|
||
"passed": false,
|
||
"duration": 7362,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data learning, automated learning, self-improving systems",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Ancient Rome, Roman architecture, Vatican City attractions, Colosseum tourism, Roman Forum history"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:57:14.773Z",
|
||
"passed": false,
|
||
"duration": 2756,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican city attractions, colosseum tourism, roman forum history",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Colosseum, Vatican City attractions, Roman Forum ruins, historical landmarks Rome"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:57:46.922Z",
|
||
"passed": false,
|
||
"duration": 1364,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman colosseum, vatican city attractions, roman forum ruins, historical landmarks rome",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Roman architecture landmarks, Vatican City attractions, historic Roman sites, Colosseum Rome"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:58:14.587Z",
|
||
"passed": false,
|
||
"duration": 2624,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, roman architecture landmarks, vatican city attractions, historic roman sites, colosseum rome",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:58:44.596Z",
|
||
"passed": false,
|
||
"duration": 30004,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:58:46.039Z",
|
||
"passed": false,
|
||
"duration": 1435,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city, Rome, Colosseum, history, art"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:58:47.063Z",
|
||
"passed": false,
|
||
"duration": 1019,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city, rome, colosseum, history, art",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, Rome history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T13:59:00.408Z",
|
||
"passed": false,
|
||
"duration": 13342,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, rome history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome, Colosseum, Roman Forum, Vatican City, History, Art, Culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T13:59:05.427Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome, colosseum, roman forum, vatican city, history, art, culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, statistical analysis, data science, predictive algorithms, automated learning"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T13:59:07.120Z",
|
||
"passed": false,
|
||
"duration": 1689,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, statistical analysis, data science, predictive algorithms, automated learning",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T13:59:37.128Z",
|
||
"passed": false,
|
||
"duration": 30005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, data analysis, improve performance, computer learning"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T13:59:38.643Z",
|
||
"passed": false,
|
||
"duration": 1510,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data analysis, improve performance, computer learning",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, improve performance, data"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T13:59:40.004Z",
|
||
"passed": false,
|
||
"duration": 1358,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, improve performance, data",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:00:10.018Z",
|
||
"passed": false,
|
||
"duration": 30011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine Learning, Algorithms, Statistical Methods, Learning from Data, Improving Performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:00:17.625Z",
|
||
"passed": false,
|
||
"duration": 7604,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, algorithms, statistical methods, learning from data, improving performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Ancient Rome, Roman architecture, Vatican City attractions, Colosseum tourism, Roman Forum history"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:03:54.017Z",
|
||
"passed": false,
|
||
"duration": 2676,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican city attractions, colosseum tourism, roman forum history",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:03:59.025Z",
|
||
"passed": false,
|
||
"duration": 5002,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history and culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:04:00.133Z",
|
||
"passed": false,
|
||
"duration": 1099,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history and culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city, Rome, Colosseum, Vatican City, history"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:04:01.480Z",
|
||
"passed": false,
|
||
"duration": 1343,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city, rome, colosseum, vatican city, history",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:04:06.485Z",
|
||
"passed": false,
|
||
"duration": 5002,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:04:11.505Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, statistical analysis, data-driven algorithms, automated learning, predictive modeling"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:04:12.607Z",
|
||
"passed": false,
|
||
"duration": 1098,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, statistical analysis, data-driven algorithms, automated learning, predictive modeling",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods learning, data-driven learning systems, adaptive algorithms performance, self-improving machine learning"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:04:15.471Z",
|
||
"passed": false,
|
||
"duration": 2860,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods learning, data-driven learning systems, adaptive algorithms performance, self-improving machine learning",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers learn from data, improve performance, explicitly programmed"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:04:16.984Z",
|
||
"passed": false,
|
||
"duration": 1510,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers learn from data, improve performance, explicitly programmed",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:04:18.098Z",
|
||
"passed": false,
|
||
"duration": 1110,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:04:23.114Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine Learning Algorithms, Statistical Methods in Machine Learning, Self-Improving AI Algorithms, Data-Driven Machine Learning, Efficient Performance Improvement."
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:04:27.907Z",
|
||
"passed": false,
|
||
"duration": 4788,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods in machine learning, self-improving ai algorithms, data-driven machine learning, efficient performance improvement.",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Ancient Rome, Roman architecture, Vatican tourism, Colosseum history, Italian cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:06:10.947Z",
|
||
"passed": false,
|
||
"duration": 2261,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican tourism, colosseum history, italian cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:06:15.957Z",
|
||
"passed": false,
|
||
"duration": 5005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:06:17.129Z",
|
||
"passed": false,
|
||
"duration": 1164,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:06:19.075Z",
|
||
"passed": false,
|
||
"duration": 1943,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:06:24.095Z",
|
||
"passed": false,
|
||
"duration": 5016,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:06:29.106Z",
|
||
"passed": false,
|
||
"duration": 5006,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical analysis, data-driven learning, automated pattern recognition, performance optimization"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:06:31.194Z",
|
||
"passed": false,
|
||
"duration": 2083,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical analysis, data-driven learning, automated pattern recognition, performance optimization",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:06:36.201Z",
|
||
"passed": false,
|
||
"duration": 5003,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:06:37.581Z",
|
||
"passed": false,
|
||
"duration": 1376,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance."
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:06:38.721Z",
|
||
"passed": false,
|
||
"duration": 1136,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance.",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:06:43.735Z",
|
||
"passed": false,
|
||
"duration": 5010,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:06:48.743Z",
|
||
"passed": false,
|
||
"duration": 5004,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Colosseum, Vatican City tourism, Roman Forum ruins, historic Rome landmarks"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:08:18.282Z",
|
||
"passed": false,
|
||
"duration": 1556,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman colosseum, vatican city tourism, roman forum ruins, historic rome landmarks",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:08:23.302Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:08:24.515Z",
|
||
"passed": false,
|
||
"duration": 1203,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, magnificent Colosseum, historic Roman Forum, stunning Vatican City, blend of history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:08:25.485Z",
|
||
"passed": false,
|
||
"duration": 966,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, magnificent colosseum, historic roman forum, stunning vatican city, blend of history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:08:30.500Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:08:35.518Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning basics, statistical algorithms, data-driven learning, automated programming, computer performance optimization"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:08:37.665Z",
|
||
"passed": false,
|
||
"duration": 2142,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning basics, statistical algorithms, data-driven learning, automated programming, computer performance optimization",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine Learning Algorithms,Statistical Methods in AI,Data-Driven Learning Systems,Automated Performance Improvement,Self-Improving Algorithms"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:08:38.848Z",
|
||
"passed": false,
|
||
"duration": 1179,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms,statistical methods in ai,data-driven learning systems,automated performance improvement,self-improving algorithms",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, improve performance, data-driven learning, computer programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:08:40.193Z",
|
||
"passed": false,
|
||
"duration": 1339,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, improve performance, data-driven learning, computer programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:08:41.233Z",
|
||
"passed": false,
|
||
"duration": 1036,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, learning from data, performance improvement over time, unprogrammed computer learning"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:08:44.151Z",
|
||
"passed": false,
|
||
"duration": 2914,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, learning from data, performance improvement over time, unprogrammed computer learning",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:08:49.167Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Empire history, Colosseum tourism, Vatican City attractions, Roman Forum landmarks"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:09:37.561Z",
|
||
"passed": false,
|
||
"duration": 2041,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman empire history, colosseum tourism, vatican city attractions, roman forum landmarks",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:09:42.582Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:09:44.349Z",
|
||
"passed": false,
|
||
"duration": 1757,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:09:45.432Z",
|
||
"passed": false,
|
||
"duration": 1079,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:09:50.446Z",
|
||
"passed": false,
|
||
"duration": 5010,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome, Colosseum, Roman Forum, Vatican City, History"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:09:55.444Z",
|
||
"passed": false,
|
||
"duration": 4992,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome, colosseum, roman forum, vatican city, history",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical data analysis, automated learning systems, predictive modeling, data-driven programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:09:57.245Z",
|
||
"passed": false,
|
||
"duration": 1796,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical data analysis, automated learning systems, predictive modeling, data-driven programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:10:02.263Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers learning from data, improve performance over time, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:10:04.357Z",
|
||
"passed": false,
|
||
"duration": 2089,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers learning from data, improve performance over time, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:10:05.365Z",
|
||
"passed": false,
|
||
"duration": 1003,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:10:10.381Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:10:15.395Z",
|
||
"passed": false,
|
||
"duration": 5009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Colosseum, Vatican City tourism, historic Roman Forum, Rome cultural attractions"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:10:49.147Z",
|
||
"passed": false,
|
||
"duration": 2477,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman colosseum, vatican city tourism, historic roman forum, rome cultural attractions",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:10:54.164Z",
|
||
"passed": false,
|
||
"duration": 5011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history and culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:10:55.469Z",
|
||
"passed": false,
|
||
"duration": 1296,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history and culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history, art, culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:10:56.445Z",
|
||
"passed": false,
|
||
"duration": 971,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history, art, culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:11:01.460Z",
|
||
"passed": false,
|
||
"duration": 5011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:11:06.481Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical analysis, data-driven learning, automated programming, predictive modeling"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:11:07.998Z",
|
||
"passed": false,
|
||
"duration": 1512,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical analysis, data-driven learning, automated programming, predictive modeling",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:11:13.011Z",
|
||
"passed": false,
|
||
"duration": 5008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, improve performance, learn from data, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:11:14.348Z",
|
||
"passed": false,
|
||
"duration": 1332,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, improve performance, learn from data, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, improve performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:11:16.146Z",
|
||
"passed": false,
|
||
"duration": 1794,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, improve performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:11:21.158Z",
|
||
"passed": false,
|
||
"duration": 5009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:11:26.168Z",
|
||
"passed": false,
|
||
"duration": 5004,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Colosseum, Vatican City, Roman Forum, historic Italian landmarks"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:12:21.933Z",
|
||
"passed": false,
|
||
"duration": 1921,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman colosseum, vatican city, roman forum, historic italian landmarks",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:12:26.952Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman Colosseum, Vatican City tours, Roman Forum ruins, historic Rome attractions"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:12:37.437Z",
|
||
"passed": false,
|
||
"duration": 2438,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman colosseum, vatican city tours, roman forum ruins, historic rome attractions",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:12:42.449Z",
|
||
"passed": false,
|
||
"duration": 5005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Colosseum history, Roman Forum visitors, Vatican City attractions, Rome art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:12:43.676Z",
|
||
"passed": false,
|
||
"duration": 1212,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, colosseum history, roman forum visitors, vatican city attractions, rome art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, magnificent Colosseum, historic Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:12:44.912Z",
|
||
"passed": false,
|
||
"duration": 1231,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, magnificent colosseum, historic roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:12:49.919Z",
|
||
"passed": false,
|
||
"duration": 5002,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:12:54.939Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, statistical analysis, data-driven algorithms, automated learning systems, predictive modeling"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:12:56.470Z",
|
||
"passed": false,
|
||
"duration": 1525,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, statistical analysis, data-driven algorithms, automated learning systems, predictive modeling",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:13:01.489Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, algorithms, statistical methods, data analysis, improve performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:13:02.739Z",
|
||
"passed": false,
|
||
"duration": 1244,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, algorithms, statistical methods, data analysis, improve performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, learn from data, improve performance."
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:13:03.946Z",
|
||
"passed": false,
|
||
"duration": 1201,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, learn from data, improve performance.",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, data-driven learning, performance improvement, automated machine learning"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:13:08.709Z",
|
||
"passed": false,
|
||
"duration": 4759,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data-driven learning, performance improvement, automated machine learning",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:13:13.723Z",
|
||
"passed": false,
|
||
"duration": 5008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:176:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman architecture, Vatican tourism, Colosseum landmarks, historical monuments"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:15:10.989Z",
|
||
"passed": false,
|
||
"duration": 1931,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican tourism, colosseum landmarks, historical monuments",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:15:16.002Z",
|
||
"passed": false,
|
||
"duration": 5007,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:15:17.078Z",
|
||
"passed": false,
|
||
"duration": 1064,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:15:18.626Z",
|
||
"passed": false,
|
||
"duration": 1543,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:15:23.647Z",
|
||
"passed": false,
|
||
"duration": 5017,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:15:28.670Z",
|
||
"passed": false,
|
||
"duration": 5016,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical analysis, data-driven learning, automated model training, predictive analytics"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:15:30.797Z",
|
||
"passed": false,
|
||
"duration": 2120,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical analysis, data-driven learning, automated model training, predictive analytics",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:15:35.817Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, optimize performance, computer learning, data improvement"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:15:37.800Z",
|
||
"passed": false,
|
||
"duration": 1975,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, optimize performance, computer learning, data improvement",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:15:39.068Z",
|
||
"passed": false,
|
||
"duration": 1262,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:15:44.079Z",
|
||
"passed": false,
|
||
"duration": 5005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine Learning Algorithms, Statistical Methods, Data-Driven Learning, Automated Improvement, Unsupervised Programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:15:48.388Z",
|
||
"passed": false,
|
||
"duration": 4303,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data-driven learning, automated improvement, unsupervised programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Ancient Rome tourism, Roman Colosseum attractions, Vatican City sightseeing, historic Roman Forum, Rome cultural landmarks"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:18:01.333Z",
|
||
"passed": false,
|
||
"duration": 1981,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, roman colosseum attractions, vatican city sightseeing, historic roman forum, rome cultural landmarks",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:18:06.353Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Colosseum attractions, Roman Forum history, Vatican City art, Rome cultural experiences"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:18:07.939Z",
|
||
"passed": false,
|
||
"duration": 1576,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, colosseum attractions, roman forum history, vatican city art, rome cultural experiences",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:18:09.011Z",
|
||
"passed": false,
|
||
"duration": 1068,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:18:14.019Z",
|
||
"passed": false,
|
||
"duration": 5004,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, Italian history"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:18:18.278Z",
|
||
"passed": false,
|
||
"duration": 4253,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, italian history",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning, statistical analysis, data science, artificial intelligence, predictive algorithms"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:18:19.203Z",
|
||
"passed": false,
|
||
"duration": 920,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning, statistical analysis, data science, artificial intelligence, predictive algorithms",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:18:24.214Z",
|
||
"passed": false,
|
||
"duration": 5005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:18:25.284Z",
|
||
"passed": false,
|
||
"duration": 1065,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, improve performance, data"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:18:28.908Z",
|
||
"passed": false,
|
||
"duration": 3619,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, improve performance, data",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:18:33.928Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:18:38.942Z",
|
||
"passed": false,
|
||
"duration": 5009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Roman Colosseum attractions, Vatican City landmarks, historic Roman Forum, Rome cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:19:46.962Z",
|
||
"passed": false,
|
||
"duration": 2552,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, roman colosseum attractions, vatican city landmarks, historic roman forum, rome cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:19:51.972Z",
|
||
"passed": false,
|
||
"duration": 5003,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Colosseum visitors guide, Roman Forum history, Vatican City travel tips, Rome art and culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:19:53.129Z",
|
||
"passed": false,
|
||
"duration": 1147,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, colosseum visitors guide, roman forum history, vatican city travel tips, rome art and culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:19:54.207Z",
|
||
"passed": false,
|
||
"duration": 1073,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:19:59.229Z",
|
||
"passed": false,
|
||
"duration": 5017,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:20:04.243Z",
|
||
"passed": false,
|
||
"duration": 5008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical analysis, data-driven learning, automated programming, computer performance optimization"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:20:05.931Z",
|
||
"passed": false,
|
||
"duration": 1682,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical analysis, data-driven learning, automated programming, computer performance optimization",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:20:10.946Z",
|
||
"passed": false,
|
||
"duration": 5010,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, data analysis, computer learning, algorithm performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:20:12.421Z",
|
||
"passed": false,
|
||
"duration": 1470,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data analysis, computer learning, algorithm performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance."
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:20:13.722Z",
|
||
"passed": false,
|
||
"duration": 1296,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance.",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:20:18.741Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:20:23.749Z",
|
||
"passed": false,
|
||
"duration": 5002,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Roman architecture, Vatican tourism, Colosseum history, Italian cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:21:38.678Z",
|
||
"passed": false,
|
||
"duration": 1437,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, roman architecture, vatican tourism, colosseum history, italian cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome,Colosseum,Roman Forum,Vatican City,history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:21:40.263Z",
|
||
"passed": false,
|
||
"duration": 1577,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome,colosseum,roman forum,vatican city,history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:21:41.195Z",
|
||
"passed": false,
|
||
"duration": 926,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:21:43.283Z",
|
||
"passed": false,
|
||
"duration": 2083,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:21:48.295Z",
|
||
"passed": false,
|
||
"duration": 5006,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Colosseum, Roman Forum, Vatican City, ancient Rome, cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:21:53.227Z",
|
||
"passed": false,
|
||
"duration": 4923,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got colosseum, roman forum, vatican city, ancient rome, cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning techniques, statistical algorithms, data-driven learning, automated pattern recognition, AI training methods"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:21:54.430Z",
|
||
"passed": false,
|
||
"duration": 1198,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning techniques, statistical algorithms, data-driven learning, automated pattern recognition, ai training methods",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:21:59.447Z",
|
||
"passed": false,
|
||
"duration": 5011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, improve performance, learn from data, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:22:01.398Z",
|
||
"passed": false,
|
||
"duration": 1946,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, improve performance, learn from data, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:22:02.526Z",
|
||
"passed": false,
|
||
"duration": 1121,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:22:07.546Z",
|
||
"passed": false,
|
||
"duration": 5015,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:22:12.566Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome tourism, Roman Colosseum landmarks, Vatican City attractions, historic Roman Forum, Rome cultural heritage"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:24:05.501Z",
|
||
"passed": false,
|
||
"duration": 2224,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome tourism, roman colosseum landmarks, vatican city attractions, historic roman forum, rome cultural heritage",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:24:10.522Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome tourism, Colosseum history, Roman Forum attractions, Vatican City art, ancient Roman culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:24:11.691Z",
|
||
"passed": false,
|
||
"duration": 1159,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome tourism, colosseum history, roman forum attractions, vatican city art, ancient roman culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:24:16.700Z",
|
||
"passed": false,
|
||
"duration": 5003,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:24:21.709Z",
|
||
"passed": false,
|
||
"duration": 5002,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Rome, Colosseum, Roman Forum, Vatican City, history, art, culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:24:26.091Z",
|
||
"passed": false,
|
||
"duration": 4375,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got rome, colosseum, roman forum, vatican city, history, art, culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical analysis, data-driven learning, automated programming, AI model training"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:24:27.364Z",
|
||
"passed": false,
|
||
"duration": 1268,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical analysis, data-driven learning, automated programming, ai model training",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:24:32.386Z",
|
||
"passed": false,
|
||
"duration": 5016,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:24:33.642Z",
|
||
"passed": false,
|
||
"duration": 1251,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers learn from data, improve performance, explicit programming",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:24:34.602Z",
|
||
"passed": false,
|
||
"duration": 954,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, data-driven learning, automated performance improvement, self-improving algorithms"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:24:39.037Z",
|
||
"passed": false,
|
||
"duration": 4430,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, data-driven learning, automated performance improvement, self-improving algorithms",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:24:44.055Z",
|
||
"passed": false,
|
||
"duration": 5011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum tourism, Roman Forum attractions, Vatican City sightseeing, historic Rome landmarks"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:24:58.096Z",
|
||
"passed": false,
|
||
"duration": 1719,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum tourism, roman forum attractions, vatican city sightseeing, historic rome landmarks",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:25:03.115Z",
|
||
"passed": false,
|
||
"duration": 5013,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient Rome, Colosseum, Roman Forum, Vatican City, history art culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:25:04.665Z",
|
||
"passed": false,
|
||
"duration": 1539,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient rome, colosseum, roman forum, vatican city, history art culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"ancient city of Rome, Colosseum, Roman Forum, Vatican City, history, art, culture"
|
||
],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:25:05.673Z",
|
||
"passed": false,
|
||
"duration": 1002,
|
||
"reason": "Expected Rome, Colosseum, Roman Forum, Vatican City, ancient history, but got ancient city of rome, colosseum, roman forum, vatican city, history, art, culture",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:25:10.689Z",
|
||
"passed": false,
|
||
"duration": 5011,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"The ancient city of Rome, with its magnificent Colosseum, historic Roman Forum, and stunning Vatican City, offers visitors a unique blend of history, art, and culture.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "Rome, Colosseum, Roman Forum, Vatican City, ancient history",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:25:15.703Z",
|
||
"passed": false,
|
||
"duration": 5007,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical learning, data science, automated learning, predictive modeling"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"router": "anthropic/claude-3.5-sonnet",
|
||
"timestamp": "2025-04-02T14:25:17.540Z",
|
||
"passed": false,
|
||
"duration": 1830,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical learning, data science, automated learning, predictive modeling",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "qwen/qwq-32b",
|
||
"router": "qwen/qwq-32b",
|
||
"timestamp": "2025-04-02T14:25:22.559Z",
|
||
"passed": false,
|
||
"duration": 5012,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"machine learning algorithms, statistical methods, computer learning, data improvement, performance enhancement"
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T14:25:24.259Z",
|
||
"passed": false,
|
||
"duration": 1694,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computer learning, data improvement, performance enhancement",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [
|
||
"Machine learning algorithms, statistical methods, computers, data, performance."
|
||
],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T14:25:25.146Z",
|
||
"passed": false,
|
||
"duration": 881,
|
||
"reason": "Expected machine learning, algorithms, artificial intelligence, data science, statistical methods, but got machine learning algorithms, statistical methods, computers, data, performance.",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1",
|
||
"router": "deepseek/deepseek-r1",
|
||
"timestamp": "2025-04-02T14:25:30.156Z",
|
||
"passed": false,
|
||
"duration": 5005,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"prompt": "Generate 5 SEO keywords for this text: \"Machine learning algorithms use statistical methods to enable computers to learn from data and improve their performance over time without being explicitly programmed.\" Return only the keywords separated by commas, no explanation.",
|
||
"result": [],
|
||
"expected": "machine learning, algorithms, artificial intelligence, data science, statistical methods",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T14:25:35.171Z",
|
||
"passed": false,
|
||
"duration": 5008,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:138:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "seo"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:20:14.739Z",
|
||
"passed": false,
|
||
"duration": 5009,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:182:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:20:14.746Z\"}. Return the read data in JSON format.",
|
||
"result": [],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:20:14.746Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:20:19.753Z",
|
||
"passed": false,
|
||
"duration": 5007,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:182:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot. Return the list as a JSON array of filenames.",
|
||
"result": [],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:20:24.772Z",
|
||
"passed": false,
|
||
"duration": 5014,
|
||
"error": {
|
||
"message": "API call timed out",
|
||
"code": "UNKNOWN",
|
||
"type": "Error",
|
||
"details": {
|
||
"stack": "Error: API call timed out\n at Timeout._onTimeout (C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\commons.ts:182:33)\n at listOnTimeout (node:internal/timers:594:17)\n at processTimers (node:internal/timers:529:7)",
|
||
"message": "API call timed out"
|
||
}
|
||
},
|
||
"reason": "API call timed out",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"Please specify the the JSON format you want the results in."
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:22:06.731Z",
|
||
"passed": false,
|
||
"duration": 4124,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got please specify the the json format you want the results in.",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:22:06.737Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"Here's the data read from the file:\n\n```json\n{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:22:06.737Z\"}\n```"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:22:06.737Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:22:12.607Z",
|
||
"passed": false,
|
||
"duration": 5870,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:22:06.737Z\"}, but got here's the data read from the file:\n\n```json\n{\"test\":\"data\",\"timestamp\":\"2025-04-02t19:22:06.737z\"}\n```",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [
|
||
"It seems there is an issue retrieving the list of files. Please ensure the directory path is correct and accessible. If you have any other requests, feel free to let me know!"
|
||
],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:22:17.893Z",
|
||
"passed": false,
|
||
"duration": 5282,
|
||
"reason": "Expected [], but got it seems there is an issue retrieving the list of files. please ensure the directory path is correct and accessible. if you have any other requests, feel free to let me know!",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"I attempted to read the file but it seems there might be an access issue or the file does not exist. Could you please check the file path or provide access details?"
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:23:59.211Z",
|
||
"passed": false,
|
||
"duration": 4000,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got i attempted to read the file but it seems there might be an access issue or the file does not exist. could you please check the file path or provide access details?",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:23:59.217Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"```json\n{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:23:59.217Z\"}\n```"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:23:59.217Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:24:04.105Z",
|
||
"passed": false,
|
||
"duration": 4888,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:23:59.217Z\"}, but got ```json\n{\"test\":\"data\",\"timestamp\":\"2025-04-02t19:23:59.217z\"}\n```",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [
|
||
"I cannot assist with seeking content from your files."
|
||
],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:24:07.315Z",
|
||
"passed": false,
|
||
"duration": 3205,
|
||
"reason": "Expected [], but got i cannot assist with seeking content from your files.",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"It seems that I don't have automatic access to read files from your system. I can guide you on how to get the content of the file or you can paste the equations here, and I can help you solve them. What would you prefer?"
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:24:28.988Z",
|
||
"passed": false,
|
||
"duration": 4398,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got it seems that i don't have automatic access to read files from your system. i can guide you on how to get the content of the file or you can paste the equations here, and i can help you solve them. what would you prefer?",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:24:28.994Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"It seems there was a repeated request for the file's content. To ensure consistency, here is the decoded data from the last correct read attempt:\n\n```json\n{\n \"test\": \"data\",\n \"timestamp\": \"2025-04-02T19:24:28.994Z\"\n}\n```"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:24:28.994Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:24:42.733Z",
|
||
"passed": false,
|
||
"duration": 13739,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:24:28.994Z\"}, but got it seems there was a repeated request for the file's content. to ensure consistency, here is the decoded data from the last correct read attempt:\n\n```json\n{\n \"test\": \"data\",\n \"timestamp\": \"2025-04-02t19:24:28.994z\"\n}\n```",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [
|
||
"I am unable to list the files in the directory `C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data`. Please verify that the directory path is correct and accessible."
|
||
],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:24:53.674Z",
|
||
"passed": false,
|
||
"duration": 10936,
|
||
"reason": "Expected [], but got i am unable to list the files in the directory `c:\\users\\zx\\desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data`. please verify that the directory path is correct and accessible.",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"It seems like the file is not accessible at the moment. Please ensure the file path is correct or try again later."
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:25:35.205Z",
|
||
"passed": false,
|
||
"duration": 3155,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got it seems like the file is not accessible at the moment. please ensure the file path is correct or try again later.",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:25:35.210Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:25:35.210Z\"}"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:25:35.210Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:25:40.298Z",
|
||
"passed": false,
|
||
"duration": 5088,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:25:35.210Z\"}, but got {\"test\":\"data\",\"timestamp\":\"2025-04-02t19:25:35.210z\"}",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:25:55.283Z",
|
||
"passed": false,
|
||
"duration": 14981,
|
||
"reason": "Model returned empty response",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\units\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"It seems I attempted to read a file from your local system but encountered an issue as I don't have direct access to files on your device. Please open the file and paste the equations here, and I'll be happy to help you solve them!"
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:27:27.676Z",
|
||
"passed": false,
|
||
"duration": 3474,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got it seems i attempted to read a file from your local system but encountered an issue as i don't have direct access to files on your device. please open the file and paste the equations here, and i'll be happy to help you solve them!",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:27:27.682Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:27:27.682Z\"}"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:27:27.682Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:27:32.435Z",
|
||
"passed": false,
|
||
"duration": 4753,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:27:27.682Z\"}, but got {\"test\":\"data\",\"timestamp\":\"2025-04-02t19:27:27.682z\"}",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [
|
||
"I am unable to access the directory. Please make sure that the directory path is correct and accessible, or check if there are any permission restrictions. If you have any specific questions or need further assistance, please let me know!"
|
||
],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:27:43.106Z",
|
||
"passed": false,
|
||
"duration": 10667,
|
||
"reason": "Expected [], but got i am unable to access the directory. please make sure that the directory path is correct and accessible, or check if there are any permission restrictions. if you have any specific questions or need further assistance, please let me know!",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"prompt": "Read the file at C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\units\\tools.test.md and solve all equations. Return the results in the specified JSON format.",
|
||
"result": [
|
||
"I cannot directly access the file as it's on a local system. You can provide its contents, and I'll assist you in solving the equations."
|
||
],
|
||
"expected": "[{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:29:20.992Z",
|
||
"passed": false,
|
||
"duration": 4181,
|
||
"reason": "Expected [{\"equation\":\"2x + 5 = 13\",\"result\":\"4\"},{\"equation\":\"3y - 7 = 20\",\"result\":\"9\"},{\"equation\":\"4z + 8 = 32\",\"result\":\"6\"}], but got i cannot directly access the file as it's on a local system. you can provide its contents, and i'll assist you in solving the equations.",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"prompt": "Write the following data to C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data\\test-data.json and then read it back: {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:29:20.998Z\"}. Return the read data in JSON format.",
|
||
"result": [
|
||
"{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:29:20.998Z\"}"
|
||
],
|
||
"expected": "{\"test\":\"data\",\"timestamp\":\"2025-04-02T19:29:20.998Z\"}",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:29:28.241Z",
|
||
"passed": false,
|
||
"duration": 7243,
|
||
"reason": "Expected {\"test\":\"data\",\"timestamp\":\"2025-04-02T19:29:20.998Z\"}, but got {\"test\":\"data\",\"timestamp\":\"2025-04-02t19:29:20.998z\"}",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"prompt": "List all files in the directory C:\\Users\\zx\\Desktop\\polymech\\polymech-mono\\packages\\kbot\\tests\\unit\\test-data. Return the list as a JSON array of filenames.",
|
||
"result": [
|
||
"{\"files\":[]}"
|
||
],
|
||
"expected": "[]",
|
||
"model": "openai/gpt-4o",
|
||
"router": "openai/gpt-4o",
|
||
"timestamp": "2025-04-02T19:29:30.520Z",
|
||
"passed": false,
|
||
"duration": 2274,
|
||
"reason": "Expected [], but got {\"files\":[]}",
|
||
"category": "tools"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:06:38.904Z",
|
||
"passed": true,
|
||
"duration": 2263,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:06:41.138Z",
|
||
"passed": true,
|
||
"duration": 2228,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:06:41.934Z",
|
||
"passed": true,
|
||
"duration": 791,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:06:43.239Z",
|
||
"passed": true,
|
||
"duration": 1300,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8 × 3 = 24"
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:06:46.025Z",
|
||
"passed": false,
|
||
"duration": 2782,
|
||
"reason": "Expected 24, but got 8 × 3 = 24",
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:06:47.239Z",
|
||
"passed": true,
|
||
"duration": 1206,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:06:48.026Z",
|
||
"passed": true,
|
||
"duration": 783,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:06:51.012Z",
|
||
"passed": true,
|
||
"duration": 2982,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:06:51.777Z",
|
||
"passed": true,
|
||
"duration": 760,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:08:37.779Z",
|
||
"passed": false,
|
||
"duration": 1244,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"The solutions to the quadratic equation x² + 5x + 6 = 0 are -2 and -3.\n\n\\boxed{-2}, \\boxed{-3}"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:08:48.803Z",
|
||
"passed": false,
|
||
"duration": 11013,
|
||
"reason": "Expected -3,-2, but got the solutions to the quadratic equation x² + 5x + 6 = 0 are -2 and -3.\n\n\\boxed{-2}, \\boxed{-3}",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-3,-2",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:08:50.291Z",
|
||
"passed": false,
|
||
"duration": 1482,
|
||
"reason": "Expected -3,-2, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:08:51.033Z",
|
||
"passed": true,
|
||
"duration": 736,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:08:55.877Z",
|
||
"passed": true,
|
||
"duration": 4838,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:08:56.613Z",
|
||
"passed": true,
|
||
"duration": 730,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:08:57.421Z",
|
||
"passed": true,
|
||
"duration": 802,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"The 6th number in the Fibonacci sequence is 5. \n\n5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:09:04.449Z",
|
||
"passed": false,
|
||
"duration": 7023,
|
||
"reason": "Expected 8, but got the 6th number in the fibonacci sequence is 5. \n\n5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:09:05.286Z",
|
||
"passed": false,
|
||
"duration": 831,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:09:06.233Z",
|
||
"passed": true,
|
||
"duration": 940,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:09:08.662Z",
|
||
"passed": true,
|
||
"duration": 2423,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:09:09.441Z",
|
||
"passed": true,
|
||
"duration": 773,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:09:10.298Z",
|
||
"passed": true,
|
||
"duration": 851,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:09:11.870Z",
|
||
"passed": true,
|
||
"duration": 1566,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:09:12.628Z",
|
||
"passed": true,
|
||
"duration": 753,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:11:07.251Z",
|
||
"passed": false,
|
||
"duration": 1329,
|
||
"reason": "Expected -2,-3, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:11:14.807Z",
|
||
"passed": false,
|
||
"duration": 7547,
|
||
"reason": "Expected -2,-3, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:11:15.551Z",
|
||
"passed": false,
|
||
"duration": 738,
|
||
"reason": "Expected -2,-3, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:11:16.305Z",
|
||
"passed": true,
|
||
"duration": 749,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:11:21.413Z",
|
||
"passed": true,
|
||
"duration": 5102,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:11:22.690Z",
|
||
"passed": true,
|
||
"duration": 1271,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:11:23.404Z",
|
||
"passed": true,
|
||
"duration": 707,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:11:32.032Z",
|
||
"passed": false,
|
||
"duration": 8621,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:11:33.022Z",
|
||
"passed": false,
|
||
"duration": 983,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:11:33.875Z",
|
||
"passed": true,
|
||
"duration": 845,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:11:37.488Z",
|
||
"passed": true,
|
||
"duration": 3608,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:11:38.246Z",
|
||
"passed": true,
|
||
"duration": 753,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-02T22:11:39.169Z",
|
||
"passed": true,
|
||
"duration": 918,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-02T22:11:43.117Z",
|
||
"passed": true,
|
||
"duration": 3943,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-02T22:11:44.077Z",
|
||
"passed": true,
|
||
"duration": 954,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-3, -2"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:09:38.709Z",
|
||
"passed": false,
|
||
"duration": 1685,
|
||
"reason": "Expected -2,-3, but got -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"The solutions to the quadratic equation x² + 5x + 6 = 0 are -2 and -3.\n\nSpecific steps:\n\n1. **Identify coefficients**: a = 1, b = 5, c = 6.\n2. **Calculate discriminant**: b² - 4ac = 25 - 24 = 1.\n3. **Apply quadratic formula**: x = (-5 ± √1)/2.\n4. **Compute solutions**: x = (-5 + 1)/2 = -2 and x = (-5 - 1)/2 = -3.\n\n-2, -3\n\nAnswer: -2,-3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:09:49.547Z",
|
||
"passed": false,
|
||
"duration": 10827,
|
||
"reason": "Expected -2,-3, but got the solutions to the quadratic equation x² + 5x + 6 = 0 are -2 and -3.\n\nspecific steps:\n\n1. **identify coefficients**: a = 1, b = 5, c = 6.\n2. **calculate discriminant**: b² - 4ac = 25 - 24 = 1.\n3. **apply quadratic formula**: x = (-5 ± √1)/2.\n4. **compute solutions**: x = (-5 + 1)/2 = -2 and x = (-5 - 1)/2 = -3.\n\n-2, -3\n\nanswer: -2,-3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:09:50.489Z",
|
||
"passed": false,
|
||
"duration": 935,
|
||
"reason": "Expected -2,-3, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:09:54.489Z",
|
||
"passed": true,
|
||
"duration": 3991,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"5! = 120\n\nThe factorial of 5 is calculated as:\n\n5 × 4 × 3 × 2 × 1 = 120\n\n**Answer:** 120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:10:03.614Z",
|
||
"passed": false,
|
||
"duration": 9116,
|
||
"reason": "Expected 120, but got 5! = 120\n\nthe factorial of 5 is calculated as:\n\n5 × 4 × 3 × 2 × 1 = 120\n\n**answer:** 120",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:10:04.483Z",
|
||
"passed": true,
|
||
"duration": 861,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:10:05.284Z",
|
||
"passed": true,
|
||
"duration": 792,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:10:13.584Z",
|
||
"passed": false,
|
||
"duration": 8292,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:10:14.350Z",
|
||
"passed": false,
|
||
"duration": 756,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:10:15.250Z",
|
||
"passed": true,
|
||
"duration": 892,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:10:17.013Z",
|
||
"passed": true,
|
||
"duration": 1755,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:10:17.849Z",
|
||
"passed": true,
|
||
"duration": 828,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:10:18.651Z",
|
||
"passed": true,
|
||
"duration": 795,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:10:25.922Z",
|
||
"passed": true,
|
||
"duration": 7263,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:10:26.895Z",
|
||
"passed": true,
|
||
"duration": 966,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:14:04.393Z",
|
||
"passed": true,
|
||
"duration": 1484,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:14:12.861Z",
|
||
"passed": true,
|
||
"duration": 8460,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:14:13.779Z",
|
||
"passed": true,
|
||
"duration": 910,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:14:14.740Z",
|
||
"passed": true,
|
||
"duration": 955,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:14:22.399Z",
|
||
"passed": true,
|
||
"duration": 7653,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:14:23.502Z",
|
||
"passed": true,
|
||
"duration": 1095,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-03T17:14:24.325Z",
|
||
"passed": true,
|
||
"duration": 816,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"15 divided by 3 is 5. \n\nAnswer: 5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-03T17:14:40.987Z",
|
||
"passed": false,
|
||
"duration": 16655,
|
||
"reason": "Expected 5, but got 15 divided by 3 is 5. \n\nanswer: 5",
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-03T17:14:41.951Z",
|
||
"passed": true,
|
||
"duration": 954,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:36:55.754Z",
|
||
"passed": true,
|
||
"duration": 1505,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:36:59.232Z",
|
||
"passed": true,
|
||
"duration": 3470,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:37:00.080Z",
|
||
"passed": true,
|
||
"duration": 842,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"prompt": "add 5 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:37:00.897Z",
|
||
"passed": true,
|
||
"duration": 811,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:37:01.784Z",
|
||
"passed": true,
|
||
"duration": 881,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [],
|
||
"expected": "24",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:37:03.117Z",
|
||
"passed": false,
|
||
"duration": 1327,
|
||
"reason": "Model returned empty response",
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:37:04.222Z",
|
||
"passed": true,
|
||
"duration": 1096,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"prompt": "multiply 8 and 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"24"
|
||
],
|
||
"expected": "24",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:37:05.008Z",
|
||
"passed": true,
|
||
"duration": 780,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:37:05.799Z",
|
||
"passed": true,
|
||
"duration": 784,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:37:10.272Z",
|
||
"passed": true,
|
||
"duration": 4467,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:37:11.255Z",
|
||
"passed": true,
|
||
"duration": 975,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "division",
|
||
"prompt": "divide 15 by 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "5",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:37:11.993Z",
|
||
"passed": true,
|
||
"duration": 731,
|
||
"category": "basic"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:38:12.580Z",
|
||
"passed": true,
|
||
"duration": 1229,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"The solutions to the quadratic equation x² + 5x + 6 = 0 are -3, -2.\n\nAnswer: -3, -2"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:38:24.221Z",
|
||
"passed": false,
|
||
"duration": 11633,
|
||
"reason": "Expected -2,-3, but got the solutions to the quadratic equation x² + 5x + 6 = 0 are -3, -2.\n\nanswer: -3, -2",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2, -3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:38:25.175Z",
|
||
"passed": false,
|
||
"duration": 943,
|
||
"reason": "Expected -2,-3, but got -2, -3",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "quadratic",
|
||
"prompt": "Solve the quadratic equation x² + 5x + 6 = 0. Return only the solutions as comma-separated numbers, no explanation.",
|
||
"result": [
|
||
"-2,-3"
|
||
],
|
||
"expected": "-2,-3",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:38:26.290Z",
|
||
"passed": true,
|
||
"duration": 1105,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:38:27.138Z",
|
||
"passed": true,
|
||
"duration": 838,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:38:34.971Z",
|
||
"passed": true,
|
||
"duration": 7825,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:38:35.899Z",
|
||
"passed": true,
|
||
"duration": 920,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"prompt": "Calculate 5! (factorial of 5). Return only the number, no explanation.",
|
||
"result": [
|
||
"120"
|
||
],
|
||
"expected": "120",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:38:36.748Z",
|
||
"passed": true,
|
||
"duration": 840,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:38:37.951Z",
|
||
"passed": true,
|
||
"duration": 1195,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:38:49.318Z",
|
||
"passed": false,
|
||
"duration": 11358,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"5"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:38:50.264Z",
|
||
"passed": false,
|
||
"duration": 935,
|
||
"reason": "Expected 8, but got 5",
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"prompt": "Calculate the 6th number in the Fibonacci sequence. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:38:50.973Z",
|
||
"passed": true,
|
||
"duration": 701,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:38:51.774Z",
|
||
"passed": true,
|
||
"duration": 793,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:39:08.114Z",
|
||
"passed": true,
|
||
"duration": 16332,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:39:09.133Z",
|
||
"passed": true,
|
||
"duration": 1012,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"prompt": "Calculate the square root of 16. Return only the number, no explanation.",
|
||
"result": [
|
||
"4"
|
||
],
|
||
"expected": "4",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:39:10.677Z",
|
||
"passed": true,
|
||
"duration": 1535,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:39:11.607Z",
|
||
"passed": true,
|
||
"duration": 922,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:39:18.707Z",
|
||
"passed": true,
|
||
"duration": 7091,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:39:19.719Z",
|
||
"passed": true,
|
||
"duration": 1004,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "power",
|
||
"prompt": "Calculate 2 raised to the power of 3. Return only the number, no explanation.",
|
||
"result": [
|
||
"8"
|
||
],
|
||
"expected": "8",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:39:21.294Z",
|
||
"passed": true,
|
||
"duration": 1567,
|
||
"category": "math"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:44:45.218Z",
|
||
"passed": false,
|
||
"duration": 1435,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:44:49.883Z",
|
||
"passed": false,
|
||
"duration": 4655,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction add(a, b) {\n return a + b;\n}\n```"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:44:51.127Z",
|
||
"passed": false,
|
||
"duration": 1237,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got ```javascript\nfunction add(a, b) {\n return a + b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction add(a, b) {\n return a + b;\n}\n```"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:44:52.054Z",
|
||
"passed": false,
|
||
"duration": 917,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got ```javascript\nfunction add(a, b) {\n return a + b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}\n```"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:44:53.187Z",
|
||
"passed": false,
|
||
"duration": 1125,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got ```javascript\nfunction factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n <= 1) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:45:02.361Z",
|
||
"passed": false,
|
||
"duration": 9166,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n <= 1) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction factorial(n) {\n if (n < 0) return undefined;\n if (n === 0) return 1;\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}\n```"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:45:04.060Z",
|
||
"passed": false,
|
||
"duration": 1690,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got ```javascript\nfunction factorial(n) {\n if (n < 0) return undefined;\n if (n === 0) return 1;\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:45:05.043Z",
|
||
"passed": false,
|
||
"duration": 975,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 1) return n;\n return fibonacci(n - 1) + fibonacci(n - 2);\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:45:06.250Z",
|
||
"passed": false,
|
||
"duration": 1200,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 1) return n;\n return fibonacci(n - 1) + fibonacci(n - 2);\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n === 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n let temp = a;\n a = b;\n b = temp + b;\n }\n return b;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:45:22.955Z",
|
||
"passed": false,
|
||
"duration": 16697,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n === 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n let temp = a;\n a = b;\n b = temp + b;\n }\n return b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:45:25.030Z",
|
||
"passed": false,
|
||
"duration": 2068,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:45:27.584Z",
|
||
"passed": false,
|
||
"duration": 2546,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction add(a, b) {\n return a + b;\n}\n```"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:45:51.588Z",
|
||
"passed": false,
|
||
"duration": 1992,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got ```javascript\nfunction add(a, b) {\n return a + b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:45:55.658Z",
|
||
"passed": false,
|
||
"duration": 4061,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction add(a, b) {\n return a + b;\n}\n```"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:45:56.953Z",
|
||
"passed": false,
|
||
"duration": 1287,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got ```javascript\nfunction add(a, b) {\n return a + b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction add(a, b) {\n return a + b;\n}\n```"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:45:57.801Z",
|
||
"passed": false,
|
||
"duration": 840,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got ```javascript\nfunction add(a, b) {\n return a + b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction factorial(n) {\n if (n === 0) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}\n```"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:45:59.452Z",
|
||
"passed": false,
|
||
"duration": 1644,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got ```javascript\nfunction factorial(n) {\n if (n === 0) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n < 2) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:46:05.931Z",
|
||
"passed": false,
|
||
"duration": 6471,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n < 2) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction factorial(n) {\n if (n < 0) return undefined;\n if (n === 0) return 1;\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}\n```"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:46:07.867Z",
|
||
"passed": false,
|
||
"duration": 1927,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got ```javascript\nfunction factorial(n) {\n if (n < 0) return undefined;\n if (n === 0) return 1;\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:46:09.006Z",
|
||
"passed": false,
|
||
"duration": 1131,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 1) {\n return n;\n } else {\n return fibonacci(n - 1) + fibonacci(n - 2);\n }\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:46:10.511Z",
|
||
"passed": false,
|
||
"duration": 1496,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 1) {\n return n;\n } else {\n return fibonacci(n - 1) + fibonacci(n - 2);\n }\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n let a = 0, b = 1;\n if (n === 0) return a;\n for (let i = 2; i <= n; i++) {\n let next = a + b;\n a = b;\n b = next;\n }\n return b;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:46:28.567Z",
|
||
"passed": false,
|
||
"duration": 18048,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n let a = 0, b = 1;\n if (n === 0) return a;\n for (let i = 2; i <= n; i++) {\n let next = a + b;\n a = b;\n b = next;\n }\n return b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 1) return n;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:46:31.014Z",
|
||
"passed": false,
|
||
"duration": 2439,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 1) return n;\n let a = 0, b = 1, temp;\n for (let i = 2; i <= n; i++) {\n temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n [a, b] = [b, a + b];\n }\n return b;\n}\n```"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:46:32.933Z",
|
||
"passed": false,
|
||
"duration": 1911,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got ```javascript\nfunction fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n [a, b] = [b, a + b];\n }\n return b;\n}\n```",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:50:37.864Z",
|
||
"passed": false,
|
||
"duration": 1441,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:50:42.826Z",
|
||
"passed": false,
|
||
"duration": 4953,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:50:44.254Z",
|
||
"passed": false,
|
||
"duration": 1420,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:50:45.251Z",
|
||
"passed": false,
|
||
"duration": 989,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:50:46.448Z",
|
||
"passed": false,
|
||
"duration": 1187,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:50:52.751Z",
|
||
"passed": false,
|
||
"duration": 6295,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n let result = 1;\n for (let i = 1; i <= n; i++) {\n result *= i;\n }\n return result;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:50:54.086Z",
|
||
"passed": false,
|
||
"duration": 1326,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:50:55.060Z",
|
||
"passed": false,
|
||
"duration": 965,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n <= 1) {\n return n;\n }\n\n return fibonacci(n - 1) + fibonacci(n - 2);\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T12:50:56.266Z",
|
||
"passed": false,
|
||
"duration": 1198,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n <= 1) {\n return n;\n }\n\n return fibonacci(n - 1) + fibonacci(n - 2);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n === 0) return 0;\n if (n === 1 || n === 2) return 1;\n let a = 1, b = 1, temp;\n for (let i = 3; i <= n; i++) {\n temp = a;\n a = a + b;\n b = temp;\n }\n return a;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T12:51:06.690Z",
|
||
"passed": false,
|
||
"duration": 10417,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n === 0) return 0;\n if (n === 1 || n === 2) return 1;\n let a = 1, b = 1, temp;\n for (let i = 3; i <= n; i++) {\n temp = a;\n a = a + b;\n b = temp;\n }\n return a;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n <= 1) return n;\n let a = 0, b = 1, c;\n for (let i = 2; i <= n; i++) {\n c = a + b;\n a = b;\n b = c;\n }\n return b;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T12:51:09.116Z",
|
||
"passed": false,
|
||
"duration": 2418,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n <= 1) return n;\n let a = 0, b = 1, c;\n for (let i = 2; i <= n; i++) {\n c = a + b;\n a = b;\n b = c;\n }\n return b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n [a, b] = [b, a + b];\n }\n return b;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:51:11.294Z",
|
||
"passed": false,
|
||
"duration": 2169,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n [a, b] = [b, a + b];\n }\n return b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"prompt": "Generate a JavaScript function that adds two numbers and returns the result. \n The function should be named 'add' and take two parameters 'a' and 'b'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function add(a, b) {\n return a + b;\n}"
|
||
],
|
||
"expected": "function add(a, b) { return a + b; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:52:19.974Z",
|
||
"passed": false,
|
||
"duration": 1425,
|
||
"reason": "Expected function add(a, b) { return a + b; }, but got function add(a, b) {\n return a + b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:52:20.932Z",
|
||
"passed": false,
|
||
"duration": 948,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"prompt": "Generate a JavaScript function that calculates the nth Fibonacci number.\n The function should be named 'fibonacci' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n let temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}"
|
||
],
|
||
"expected": "function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T12:52:22.228Z",
|
||
"passed": false,
|
||
"duration": 1287,
|
||
"reason": "Expected function fibonacci(n) { return n <= 1 ? n : fibonacci(n - 1) + fibonacci(n - 2); }, but got function fibonacci(n) {\n if (n <= 0) return 0;\n if (n === 1) return 1;\n let a = 0, b = 1;\n for (let i = 2; i <= n; i++) {\n let temp = a + b;\n a = b;\n b = temp;\n }\n return b;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:06:05.000Z",
|
||
"passed": false,
|
||
"duration": 1461,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:07:20.672Z",
|
||
"passed": false,
|
||
"duration": 1565,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n <= 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:09:05.033Z",
|
||
"passed": false,
|
||
"duration": 2296,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n <= 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let n = arr.length;\n for(let i = 0; i < n - 1; i++) {\n for(let j = 0; j < n - i - 1; j++) {\n if(arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:09:07.513Z",
|
||
"passed": false,
|
||
"duration": 2471,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let n = arr.length;\n for(let i = 0; i < n - 1; i++) {\n for(let j = 0; j < n - i - 1; j++) {\n if(arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:10:24.287Z",
|
||
"passed": false,
|
||
"duration": 1666,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let n = arr.length;\n for(let i = 0; i < n - 1; i++) {\n for(let j = 0; j < n - i - 1; j++) {\n if(arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:10:26.072Z",
|
||
"passed": false,
|
||
"duration": 1775,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let n = arr.length;\n for(let i = 0; i < n - 1; i++) {\n for(let j = 0; j < n - i - 1; j++) {\n if(arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T13:11:31.687Z",
|
||
"passed": false,
|
||
"duration": 1633,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n } else {\n return n * factorial(n - 1);\n }\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n <= 1) return 1;\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T13:11:36.495Z",
|
||
"passed": false,
|
||
"duration": 4798,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n <= 1) return 1;\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T13:11:39.078Z",
|
||
"passed": false,
|
||
"duration": 2574,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n < 0) return undefined;\n if (n === 0 || n === 1) return 1;\n let result = 1;\n for (let i = 2; i <= n; i++) {\n result *= i;\n }\n return result;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"prompt": "Generate a JavaScript function that calculates the factorial of a number.\n The function should be named 'factorial' and take one parameter 'n'.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}"
|
||
],
|
||
"expected": "function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:11:44.323Z",
|
||
"passed": false,
|
||
"duration": 5237,
|
||
"reason": "Expected function factorial(n) { return n <= 1 ? 1 : n * factorial(n - 1); }, but got function factorial(n) {\n if (n === 0 || n === 1) {\n return 1;\n }\n return n * factorial(n - 1);\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let i, j;\n for (i = 0; i < arr.length-1; i++) {\n for (j = 0; j < arr.length-i-1; j++) {\n if (arr[j] > arr[j+1]) {\n let temp = arr[j];\n arr[j] = arr[j+1];\n arr[j+1] = temp;\n }\n }\n }\n return arr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"router": "openai/gpt-3.5-turbo",
|
||
"timestamp": "2025-04-04T13:11:46.513Z",
|
||
"passed": false,
|
||
"duration": 2181,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let i, j;\n for (i = 0; i < arr.length-1; i++) {\n for (j = 0; j < arr.length-i-1; j++) {\n if (arr[j] > arr[j+1]) {\n let temp = arr[j];\n arr[j] = arr[j+1];\n arr[j+1] = temp;\n }\n }\n }\n return arr;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let sortedArr = [...arr];\n const n = sortedArr.length;\n for (let i = 0; i < n; i++) {\n let swapped = false;\n for (let j = 0; j < n - i - 1; j++) {\n if (sortedArr[j] > sortedArr[j + 1]) {\n let temp = sortedArr[j];\n sortedArr[j] = sortedArr[j + 1];\n sortedArr[j + 1] = temp;\n swapped = true;\n }\n }\n if (!swapped) break;\n }\n return sortedArr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"router": "deepseek/deepseek-r1-distill-qwen-14b:free",
|
||
"timestamp": "2025-04-04T13:12:01.405Z",
|
||
"passed": false,
|
||
"duration": 14881,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let sortedarr = [...arr];\n const n = sortedarr.length;\n for (let i = 0; i < n; i++) {\n let swapped = false;\n for (let j = 0; j < n - i - 1; j++) {\n if (sortedarr[j] > sortedarr[j + 1]) {\n let temp = sortedarr[j];\n sortedarr[j] = sortedarr[j + 1];\n sortedarr[j + 1] = temp;\n swapped = true;\n }\n }\n if (!swapped) break;\n }\n return sortedarr;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let n = arr.length;\n for (let i = 0; i < n - 1; i++) {\n for (let j = 0; j < n - 1 - i; j++) {\n if (arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "openai/gpt-4o-mini",
|
||
"router": "openai/gpt-4o-mini",
|
||
"timestamp": "2025-04-04T13:12:04.108Z",
|
||
"passed": false,
|
||
"duration": 2692,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let n = arr.length;\n for (let i = 0; i < n - 1; i++) {\n for (let j = 0; j < n - 1 - i; j++) {\n if (arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}",
|
||
"category": "coding"
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"prompt": "Generate a JavaScript function that implements bubble sort.\n The function should be named 'bubbleSort' and take one parameter 'arr' (an array of numbers).\n The function should return the sorted array.\n Return only the function code, no explanation.",
|
||
"result": [
|
||
"function bubbleSort(arr) {\n let n = arr.length;\n for (let i = 0; i < n - 1; i++) {\n for (let j = 0; j < n - 1 - i; j++) {\n if (arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}"
|
||
],
|
||
"expected": "function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }",
|
||
"model": "openrouter/quasar-alpha",
|
||
"router": "openrouter/quasar-alpha",
|
||
"timestamp": "2025-04-04T13:12:05.773Z",
|
||
"passed": false,
|
||
"duration": 1657,
|
||
"reason": "Expected function bubbleSort(arr) { const n = arr.length; for(let i = 0; i < n; i++) { for(let j = 0; j < n-i-1; j++) { if(arr[j] > arr[j+1]) { [arr[j], arr[j+1]] = [arr[j+1], arr[j]]; } } } return arr; }, but got function bubblesort(arr) {\n let n = arr.length;\n for (let i = 0; i < n - 1; i++) {\n for (let j = 0; j < n - 1 - i; j++) {\n if (arr[j] > arr[j + 1]) {\n let temp = arr[j];\n arr[j] = arr[j + 1];\n arr[j + 1] = temp;\n }\n }\n }\n return arr;\n}",
|
||
"category": "coding"
|
||
}
|
||
],
|
||
"highscores": [
|
||
{
|
||
"test": "quadratic",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 943,
|
||
"duration_secs": 0.943
|
||
},
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 1105,
|
||
"duration_secs": 1.105
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "factorial",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 838,
|
||
"duration_secs": 0.838
|
||
},
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 840,
|
||
"duration_secs": 0.84
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "fibonacci",
|
||
"rankings": [
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 701,
|
||
"duration_secs": 0.701
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 935,
|
||
"duration_secs": 0.935
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "square_root",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 793,
|
||
"duration_secs": 0.793
|
||
},
|
||
{
|
||
"model": "anthropic/claude-3.5-sonnet",
|
||
"duration": 819,
|
||
"duration_secs": 0.819
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "power",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 922,
|
||
"duration_secs": 0.922
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 1004,
|
||
"duration_secs": 1.004
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "addition",
|
||
"rankings": [
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 811,
|
||
"duration_secs": 0.811
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 842,
|
||
"duration_secs": 0.842
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "multiplication",
|
||
"rankings": [
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 780,
|
||
"duration_secs": 0.78
|
||
},
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 881,
|
||
"duration_secs": 0.881
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "division",
|
||
"rankings": [
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 731,
|
||
"duration_secs": 0.731
|
||
},
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 784,
|
||
"duration_secs": 0.784
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "seo_keywords_text",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 1002,
|
||
"duration_secs": 1.002
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 1539,
|
||
"duration_secs": 1.539
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "seo_keywords_technical",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 881,
|
||
"duration_secs": 0.881
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 1694,
|
||
"duration_secs": 1.694
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "equation_solving",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-4o",
|
||
"duration": 4181,
|
||
"duration_secs": 4.181
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "file_operations",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-4o",
|
||
"duration": 7243,
|
||
"duration_secs": 7.243
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "directory_listing",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-4o",
|
||
"duration": 2274,
|
||
"duration_secs": 2.274
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "simple_function",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 1420,
|
||
"duration_secs": 1.42
|
||
},
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 1425,
|
||
"duration_secs": 1.425
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "factorial_function",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 1633,
|
||
"duration_secs": 1.633
|
||
},
|
||
{
|
||
"model": "openai/gpt-4o-mini",
|
||
"duration": 2574,
|
||
"duration_secs": 2.574
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "fibonacci_function",
|
||
"rankings": [
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 1198,
|
||
"duration_secs": 1.198
|
||
},
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 1287,
|
||
"duration_secs": 1.287
|
||
}
|
||
]
|
||
},
|
||
{
|
||
"test": "bubble_sort_function",
|
||
"rankings": [
|
||
{
|
||
"model": "openrouter/quasar-alpha",
|
||
"duration": 1657,
|
||
"duration_secs": 1.657
|
||
},
|
||
{
|
||
"model": "openai/gpt-3.5-turbo",
|
||
"duration": 2181,
|
||
"duration_secs": 2.181
|
||
}
|
||
]
|
||
}
|
||
],
|
||
"lastUpdated": "2025-04-04T13:12:05.778Z"
|
||
} |