mirror of
https://github.com/jina-ai/node-DeepResearch.git
synced 2025-12-26 06:28:56 +08:00
fix: unnecessary eval
This commit is contained in:
parent
023bf0ef9c
commit
c5900ac767
@ -38,24 +38,6 @@ Could you please evaluate my answer based on your knowledge and strict standards
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
function getAttributionPrompt(question: string, answer: string, allKnowledge: KnowledgeItem[]): PromptPair {
|
|
||||||
return {
|
|
||||||
system: `You are an evaluator that verifies if answer content is properly attributed to and supported by the provided context.`,
|
|
||||||
user: `
|
|
||||||
<context>
|
|
||||||
${JSON.stringify(allKnowledge)}
|
|
||||||
</context>
|
|
||||||
<question>
|
|
||||||
${question}
|
|
||||||
</question>
|
|
||||||
<answer>
|
|
||||||
${answer}
|
|
||||||
</answer>
|
|
||||||
|
|
||||||
Please read and think.
|
|
||||||
`
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
function getDefinitivePrompt(question: string, answer: string): PromptPair {
|
function getDefinitivePrompt(question: string, answer: string): PromptPair {
|
||||||
return {
|
return {
|
||||||
|
|||||||
@ -6,16 +6,19 @@ import {Schemas} from "../utils/schemas";
|
|||||||
export async function cherryPick(question: string, longContext: string, options: any = {}, trackers: TrackerContext, schemaGen: Schemas, url: string) {
|
export async function cherryPick(question: string, longContext: string, options: any = {}, trackers: TrackerContext, schemaGen: Schemas, url: string) {
|
||||||
|
|
||||||
const {
|
const {
|
||||||
snippetLength = 3000,
|
snippetLength = 3000, // char length of each snippet
|
||||||
numSnippets = Math.max(2, Math.min(5, Math.floor(longContext.length / snippetLength))),
|
numSnippets = Math.max(2, Math.min(5, Math.floor(longContext.length / snippetLength))),
|
||||||
chunkSize = 300,
|
chunkSize = 300, // char length of each chunk
|
||||||
maxTokensPerRequest = 8192, // Maximum tokens per embedding request
|
|
||||||
// Rough estimate of tokens per character (can be adjusted based on your text)
|
|
||||||
tokensPerCharacter = 0.4
|
|
||||||
} = options;
|
} = options;
|
||||||
|
|
||||||
|
const maxTokensPerRequest = 8192 // Maximum tokens per embedding request
|
||||||
|
|
||||||
|
// Rough estimate of tokens per character (can be adjusted based on your text)
|
||||||
|
const tokensPerCharacter = 0.4
|
||||||
|
|
||||||
if (longContext.length < snippetLength * 2) {
|
if (longContext.length < snippetLength * 2) {
|
||||||
// If the context is shorter than the snippet length, return the whole context
|
// If the context is shorter than the snippet length, return the whole context
|
||||||
|
console.log('content is too short, dont bother')
|
||||||
return longContext;
|
return longContext;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -30,6 +33,10 @@ export async function cherryPick(question: string, longContext: string, options:
|
|||||||
trackers.actionTracker.trackThink('late_chunk', schemaGen.languageCode, {url});
|
trackers.actionTracker.trackThink('late_chunk', schemaGen.languageCode, {url});
|
||||||
|
|
||||||
try {
|
try {
|
||||||
|
if (question.trim().length === 0) {
|
||||||
|
throw new Error('Empty question, returning full context');
|
||||||
|
}
|
||||||
|
|
||||||
// Estimate the number of tokens per chunk
|
// Estimate the number of tokens per chunk
|
||||||
const estimatedTokensPerChunk = Math.ceil(chunkSize * tokensPerCharacter);
|
const estimatedTokensPerChunk = Math.ceil(chunkSize * tokensPerCharacter);
|
||||||
|
|
||||||
@ -180,11 +187,11 @@ export async function cherryPick(question: string, longContext: string, options:
|
|||||||
|
|
||||||
// wrap with <snippet-index> tag
|
// wrap with <snippet-index> tag
|
||||||
return snippets.map((snippet, index) => `
|
return snippets.map((snippet, index) => `
|
||||||
<snippet-${index+1}>
|
<snippet-${index + 1}>
|
||||||
|
|
||||||
${snippet}
|
${snippet}
|
||||||
|
|
||||||
</snippet-${index+1}>`.trim()).join("\n\n");
|
</snippet-${index + 1}>`.trim()).join("\n\n");
|
||||||
|
|
||||||
} catch (error) {
|
} catch (error) {
|
||||||
console.error('Error in late chunking:', error);
|
console.error('Error in late chunking:', error);
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user