feat: improve dedup with jina embeddings

This commit is contained in:
Han Xiao 2025-02-07 16:09:05 +08:00
parent 2b218717ae
commit f1b37c4f34

View File

@@ -3,7 +3,7 @@ import { TokenTracker } from "../utils/token-tracker";
import {JINA_API_KEY} from "../config";
const JINA_API_URL = 'https://api.jina.ai/v1/embeddings';
-const SIMILARITY_THRESHOLD = 0.85; // Adjustable threshold for cosine similarity
+const SIMILARITY_THRESHOLD = 0.95; // Adjustable threshold for cosine similarity
// Types for Jina API
interface JinaEmbeddingRequest {