530 lines
14 KiB
JSON
530 lines
14 KiB
JSON
[
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:01.527Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo\n"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:03.169Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:04.655Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:05.726Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí\n"
|
|
],
|
|
"expected": "sí",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:08.264Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:09.514Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:11.281Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non\n"
|
|
],
|
|
"expected": "non",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:12.942Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:50:14.089Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:53.360Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo\n"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:54.551Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:55.699Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:56.740Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Sí\n"
|
|
],
|
|
"expected": "sí",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:57.918Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:51:58.882Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:52:00.119Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Non\n"
|
|
],
|
|
"expected": "non",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:52:01.184Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:52:02.204Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:53:50.924Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo\n"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:53:52.477Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:53:53.546Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:53:56.815Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:53:58.718Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:54:01.673Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:01.199Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo\n"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:02.857Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:03.788Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:05.218Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí\n"
|
|
],
|
|
"expected": "sí",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:06.317Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:07.436Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:08.879Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non\n"
|
|
],
|
|
"expected": "non",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:10.365Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:11.295Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german_translation",
|
|
"prompt": "translate \"hello\" to German. Return only the translation, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:32.735Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish_translation",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translation, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:35.276Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french_translation",
|
|
"prompt": "translate \"no\" to French. Return only the translation, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:56:37.673Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german",
|
|
"prompt": "translate \"hello\" to German. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:07.944Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german",
|
|
"prompt": "translate \"hello\" to German. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"Hallo\n"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:09.471Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "german",
|
|
"prompt": "translate \"hello\" to German. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"Hallo"
|
|
],
|
|
"expected": "hallo",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:11.335Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"Sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:12.740Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"Sí\n"
|
|
],
|
|
"expected": "sí",
|
|
"model": "google/gemini-2.0-flash-exp:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:14.246Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "spanish",
|
|
"prompt": "translate \"yes\" to Spanish. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"sí"
|
|
],
|
|
"expected": "sí",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:15.205Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french",
|
|
"prompt": "translate \"no\" to French. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "deepseek/deepseek-chat:free",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:18.139Z",
|
|
"passed": true
|
|
},
|
|
{
|
|
"test": "french",
|
|
"prompt": "translate \"no\" to French. Return only the translated word, no explanation.",
|
|
"result": [
|
|
"non"
|
|
],
|
|
"expected": "non",
|
|
"model": "gpt-4",
|
|
"router": "openrouter",
|
|
"timestamp": "2025-04-01T10:59:20.589Z",
|
|
"passed": true
|
|
}
|
|
] |