FastGPT/packages/service/core/ai/rerank/index.ts
Archer 463b02d127
Some checks are pending
Document deploy / sync-images (push) Waiting to run
Document deploy / generate-timestamp (push) Blocked by required conditions
Document deploy / build-images (map[domain:https://fastgpt.cn suffix:cn]) (push) Blocked by required conditions
Document deploy / build-images (map[domain:https://fastgpt.io suffix:io]) (push) Blocked by required conditions
Document deploy / update-images (map[deployment:fastgpt-docs domain:https://fastgpt.cn kube_config:KUBE_CONFIG_CN suffix:cn]) (push) Blocked by required conditions
Document deploy / update-images (map[deployment:fastgpt-docs domain:https://fastgpt.io kube_config:KUBE_CONFIG_IO suffix:io]) (push) Blocked by required conditions
Build FastGPT images in Personal warehouse / get-vars (push) Waiting to run
Build FastGPT images in Personal warehouse / build-fastgpt-images (map[arch:amd64 runs-on:ubuntu-24.04]) (push) Blocked by required conditions
Build FastGPT images in Personal warehouse / build-fastgpt-images (map[arch:arm64 runs-on:ubuntu-24.04-arm]) (push) Blocked by required conditions
Build FastGPT images in Personal warehouse / release-fastgpt-images (push) Blocked by required conditions
perf log (#6107)
* perf: html2md

* perf: index

* Add model log

* update next version

* log index
2025-12-17 17:44:38 +08:00

89 lines
2.2 KiB
TypeScript

import { addLog } from '../../../common/system/log';
import { POST } from '../../../common/api/serverRequest';
import { getDefaultRerankModel } from '../model';
import { getAxiosConfig } from '../config';
import { type RerankModelItemType } from '@fastgpt/global/core/ai/model.d';
import { countPromptTokens } from '../../../common/string/tiktoken';
/**
 * Response body expected from the rerank endpoint called by `reRankRecall`.
 */
type PostReRankResponse = {
  id: string;
  /** One entry per scored document; `index` is used to look up the entry in the submitted documents array. */
  results: Array<{
    index: number;
    relevance_score: number;
  }>;
  /** Optional usage block; when present, `tokens.input_tokens` is preferred over a locally computed token count. */
  meta?: {
    tokens: {
      input_tokens: number;
      output_tokens: number;
    };
  };
};
/**
 * Value resolved by `reRankRecall`.
 */
type ReRankCallResult = {
  /** Scored documents, identified by the caller-supplied document `id`. */
  results: Array<{ id: string; score?: number }>;
  /** Input tokens consumed by the rerank call. */
  inputTokens: number;
};
/**
 * Rerank `documents` against `query` through a rerank model endpoint.
 *
 * Posts `{ model, query, documents: string[] }` to `model.requestUrl` when it is set,
 * otherwise to `${baseUrl}/rerank` taken from `getAxiosConfig()`, then maps every
 * returned result back to the `id` of the document found at `result.index`.
 *
 * @param model - Rerank model to call; defaults to `getDefaultRerankModel()`.
 * @param query - Query text the documents are scored against.
 * @param documents - Candidates; only `text` is sent, `id` labels the returned scores.
 * @param headers - Extra request headers. They are spread after `Authorization`,
 *   so a caller-supplied `Authorization` header takes precedence.
 * @returns The scored ids in the order the service returned them (always an array,
 *   possibly empty) and the input token count. The count reported by the service is
 *   used when it is non-zero; otherwise it is computed with `countPromptTokens`.
 *   Rejects with the string `'[Rerank] No rerank model'` when no model is available,
 *   and re-rejects with the underlying error (after logging) when the request fails.
 */
export function reRankRecall({
  model = getDefaultRerankModel(),
  query,
  documents,
  headers
}: {
  model?: RerankModelItemType;
  query: string;
  documents: { id: string; text: string }[];
  headers?: Record<string, string>;
}): Promise<ReRankCallResult> {
  if (!model) {
    // Kept as a string rejection: existing callers may rely on this exact value.
    return Promise.reject('[Rerank] No rerank model');
  }
  // Nothing to rank: skip the network round trip entirely.
  if (documents.length === 0) {
    return Promise.resolve({
      results: [],
      inputTokens: 0
    });
  }

  const { baseUrl, authorization } = getAxiosConfig();
  const start = Date.now();
  const documentsTextArray = documents.map((doc) => doc.text);

  return POST<PostReRankResponse>(
    model.requestUrl ? model.requestUrl : `${baseUrl}/rerank`,
    {
      model: model.model,
      query,
      documents: documentsTextArray
    },
    {
      headers: {
        Authorization: model.requestAuth ? `Bearer ${model.requestAuth}` : authorization,
        ...headers
      },
      timeout: 30000
    }
  )
    .then(async (data) => {
      addLog.info('ReRank finish:', { time: Date.now() - start });

      // A missing or malformed `results` field must still resolve to an array,
      // as promised by `ReRankCallResult`.
      const rawResults = Array.isArray(data?.results) ? data.results : [];
      if (rawResults.length === 0) {
        addLog.error('[Rerank] Empty result', { data });
      }

      const results: ReRankCallResult['results'] = [];
      for (const item of rawResults) {
        const doc = documents[item?.index];
        if (!doc) {
          // An index that does not point at a submitted document cannot be mapped
          // to an id; drop that entry instead of failing the whole rerank call.
          addLog.error('[Rerank] Invalid result index', {
            index: item?.index,
            documentsLength: documents.length
          });
          continue;
        }
        results.push({
          id: doc.id,
          score: item.relevance_score
        });
      }

      return {
        results,
        // `||` is intentional: a missing or zero reported count falls back to local counting.
        inputTokens:
          data?.meta?.tokens?.input_tokens ||
          (await countPromptTokens(documentsTextArray.join('\n') + query, ''))
      };
    })
    .catch((err) => {
      addLog.error('[Rerank] request error', err);
      return Promise.reject(err);
    });
}