src / services / rag / reranker.js

"use strict";
// We cannot use static imports for ESM-only modules in a CJS environment.
// We must use dynamic imports and 'any' types for the library objects.
var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
    if (k2 === undefined) k2 = k;
    var desc = Object.getOwnPropertyDescriptor(m, k);
    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
      desc = { enumerable: true, get: function() { return m[k]; } };
    }
    Object.defineProperty(o, k2, desc);
}) : (function(o, m, k, k2) {
    if (k2 === undefined) k2 = k;
    o[k2] = m[k];
}));
var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
    Object.defineProperty(o, "default", { enumerable: true, value: v });
}) : function(o, v) {
    o["default"] = v;
});
var __importStar = (this && this.__importStar) || (function () {
    var ownKeys = function(o) {
        ownKeys = Object.getOwnPropertyNames || function (o) {
            var ar = [];
            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
            return ar;
        };
        return ownKeys(o);
    };
    return function (mod) {
        if (mod && mod.__esModule) return mod;
        var result = {};
        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
        __setModuleDefault(result, mod);
        return result;
    };
})();
Object.defineProperty(exports, "__esModule", { value: true });
exports.loadReranker = loadReranker;
exports.rerank = rerank;
let transformers = null;
let tokenizer = null;
let model = null;
const MODEL_ID = 'Xenova/bge-reranker-base';
async function getTransformers() {
    if (!transformers) {
        // Dynamic import to bypass ERR_REQUIRE_ESM
        transformers = await Promise.resolve().then(() => __importStar(require('@xenova/transformers')));
        // Configure environment
        transformers.env.allowLocalModels = false; // Force download/cache usage
        transformers.env.useBrowserCache = true;
    }
    return transformers;
}
async function loadReranker() {
    if (!tokenizer || !model) {
        console.log("Loading Reranker Model (this may take a while on first run)...");
        const { AutoTokenizer, AutoModelForSequenceClassification } = await getTransformers();
        tokenizer = await AutoTokenizer.from_pretrained(MODEL_ID);
        model = await AutoModelForSequenceClassification.from_pretrained(MODEL_ID);
        console.log("Reranker Model Loaded.");
    }
}
async function rerank(query, documents) {
    await loadReranker();
    if (!tokenizer || !model)
        throw new Error("Model failed to load");
    // Construct pairs: [query, doc1], [query, doc2], ...
    const queries = new Array(documents.length).fill(query);
    // Batch processing
    const inputs = await tokenizer(queries, {
        text_pair: documents,
        padding: true,
        truncation: true
    });
    const output = await model(inputs);
    // Sigmoid to get 0-1 scores
    const scores = output.logits.sigmoid().data;
    // Map back to indices
    const results = [];
    for (let i = 0; i < scores.length; i++) {
        results.push({ index: i, score: scores[i] });
    }
    // Sort descending
    results.sort((a, b) => b.score - a.score);
    return results;
}