feat: update eval and ego questions

This commit is contained in:
Han Xiao 2025-02-07 11:56:50 +08:00
parent 1168c753ce
commit 4925303c57
2 changed files with 6 additions and 6 deletions

View File

@@ -142,7 +142,7 @@ async function batchEvaluate(inputFile: string): Promise<void> {
const {
result: response,
context
-} = await getResponse(question, 0) as { result: AnswerAction; context: TrackerContext };
+} = await getResponse(question) as { result: AnswerAction; context: TrackerContext };
const actualAnswer = response.answer;
// Evaluate the response

View File

@@ -32,7 +32,7 @@
"answer": "four: sunnyvale, berlin, beijing, shenzhen"
},
{
-"question": "what jina-colbert-v2 improves over jina-colbert-v1?",
+"question": "what exactly jina-colbert-v2 improves over jina-colbert-v1?",
"answer": "v2 add multilingual support"
},
{
@@ -40,8 +40,8 @@
"answer": "Andreas Koukounas, Georgios Mastrapas, Bo Wang, Mohammad Kalim Akram, Sedigheh Eslami, Michael Günther, Isabelle Mohr, Saba Sturua, Scott Martens, Nan Wang, Han Xiao"
},
{
-"question": "who is the common author of fashion-mnist and node-deepresearch?",
-"answer": "Han Xiao"
+"question": "who created the node-deepresearch project?",
+"answer": "Han Xiao / jina ai"
},
{
"question": "Which countries are the investors of Jina AI from?",
@@ -68,8 +68,8 @@
"answer": "Jiao Liu"
},
{
-"question": "which llm provider does node-deepresearch project support?",
-"answer": "Gemini, Openai and some local LLMs"
+"question": "what is the key idea behind node-deepresearch project?",
+"answer": "It keeps searching, reading webpages, reasoning until an answer is found."
},
{
"question": "what is the name of the jina ai's mascot?",