feat: improve dedup with jina embeddings

This commit is contained in:
Han Xiao 2025-02-07 16:09:19 +08:00
parent f1b37c4f34
commit 5e80ed40ea

View File

@@ -3,7 +3,7 @@ import { TokenTracker } from "../utils/token-tracker";
import {JINA_API_KEY} from "../config";
const JINA_API_URL = 'https://api.jina.ai/v1/embeddings';
-const SIMILARITY_THRESHOLD = 0.95; // Adjustable threshold for cosine similarity
+const SIMILARITY_THRESHOLD = 0.90; // Adjustable threshold for cosine similarity
// Types for Jina API
interface JinaEmbeddingRequest {