Project Files
src / services / rag / reranker.js
"use strict";
// We cannot use static imports for ESM-only modules in a CJS environment.
// We must use dynamic imports and 'any' types for the library objects.
var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
if (k2 === undefined) k2 = k;
var desc = Object.getOwnPropertyDescriptor(m, k);
if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
desc = { enumerable: true, get: function() { return m[k]; } };
}
Object.defineProperty(o, k2, desc);
}) : (function(o, m, k, k2) {
if (k2 === undefined) k2 = k;
o[k2] = m[k];
}));
var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
Object.defineProperty(o, "default", { enumerable: true, value: v });
}) : function(o, v) {
o["default"] = v;
});
var __importStar = (this && this.__importStar) || (function () {
var ownKeys = function(o) {
ownKeys = Object.getOwnPropertyNames || function (o) {
var ar = [];
for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
return ar;
};
return ownKeys(o);
};
return function (mod) {
if (mod && mod.__esModule) return mod;
var result = {};
if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
__setModuleDefault(result, mod);
return result;
};
})();
Object.defineProperty(exports, "__esModule", { value: true });
exports.loadReranker = loadReranker;
exports.rerank = rerank;
let transformers = null;
let tokenizer = null;
let model = null;
const MODEL_ID = 'Xenova/bge-reranker-base';
async function getTransformers() {
if (!transformers) {
// Dynamic import to bypass ERR_REQUIRE_ESM
transformers = await Promise.resolve().then(() => __importStar(require('@xenova/transformers')));
// Configure environment
transformers.env.allowLocalModels = false; // Force download/cache usage
transformers.env.useBrowserCache = true;
}
return transformers;
}
async function loadReranker() {
if (!tokenizer || !model) {
console.log("Loading Reranker Model (this may take a while on first run)...");
const { AutoTokenizer, AutoModelForSequenceClassification } = await getTransformers();
tokenizer = await AutoTokenizer.from_pretrained(MODEL_ID);
model = await AutoModelForSequenceClassification.from_pretrained(MODEL_ID);
console.log("Reranker Model Loaded.");
}
}
async function rerank(query, documents) {
await loadReranker();
if (!tokenizer || !model)
throw new Error("Model failed to load");
// Construct pairs: [query, doc1], [query, doc2], ...
const queries = new Array(documents.length).fill(query);
// Batch processing
const inputs = await tokenizer(queries, {
text_pair: documents,
padding: true,
truncation: true
});
const output = await model(inputs);
// Sigmoid to get 0-1 scores
const scores = output.logits.sigmoid().data;
// Map back to indices
const results = [];
for (let i = 0; i < scores.length; i++) {
results.push({ index: i, score: scores[i] });
}
// Sort descending
results.sort((a, b) => b.score - a.score);
return results;
}