feat: improve dedup with jina embeddings

This commit is contained in:
Han Xiao
2025-02-07 16:39:01 +08:00
parent 5e80ed40ea
commit f9cbc4008c
2 changed files with 12 additions and 12 deletions

View File

@@ -3,7 +3,7 @@ import { TokenTracker } from "../utils/token-tracker";
import {JINA_API_KEY} from "../config";
const JINA_API_URL = 'https://api.jina.ai/v1/embeddings';
-const SIMILARITY_THRESHOLD = 0.90; // Adjustable threshold for cosine similarity
+const SIMILARITY_THRESHOLD = 0.93; // Adjustable threshold for cosine similarity
// Types for Jina API
interface JinaEmbeddingRequest {