mirror of
https://github.com/Youzini-afk/ST-Bionic-Memory-Ecology.git
synced 2026-05-15 14:20:35 +08:00
427 lines
11 KiB
JavaScript
427 lines
11 KiB
JavaScript
// ST-BME: 外部 Embedding API 封装 + 向量检索
|
||
// 支持 OpenAI 兼容的 /v1/embeddings 接口
|
||
|
||
/**
|
||
* Embedding 服务
|
||
* 调用外部 API 获取文本向量,并提供暴力搜索 cosine 相似度
|
||
*/
|
||
|
||
import { getRequestHeaders } from "../../../../../script.js";
|
||
import { extension_settings } from "../../../../extensions.js";
|
||
import { resolveConfiguredTimeoutMs } from "../runtime/request-timeout.js";
|
||
|
||
const MODULE_NAME = "st_bme";
|
||
const EMBEDDING_REQUEST_TIMEOUT_MS = 300000;
|
||
const BACKEND_SOURCES_REQUIRING_API_URL = new Set([
|
||
"ollama",
|
||
"llamacpp",
|
||
"vllm",
|
||
]);
|
||
|
||
function getEmbeddingTestOverride(name) {
|
||
const override = globalThis.__stBmeTestOverrides?.embedding?.[name];
|
||
return typeof override === "function" ? override : null;
|
||
}
|
||
|
||
function getConfiguredTimeoutMs(
|
||
settings = extension_settings[MODULE_NAME] || {},
|
||
) {
|
||
return typeof resolveConfiguredTimeoutMs === "function"
|
||
? resolveConfiguredTimeoutMs(settings, EMBEDDING_REQUEST_TIMEOUT_MS)
|
||
: (() => {
|
||
const timeoutMs = Number(settings?.timeoutMs);
|
||
return Number.isFinite(timeoutMs) && timeoutMs > 0
|
||
? timeoutMs
|
||
: EMBEDDING_REQUEST_TIMEOUT_MS;
|
||
})();
|
||
}
|
||
|
||
function isAbortError(error) {
|
||
return error?.name === "AbortError";
|
||
}
|
||
|
||
function normalizeOpenAICompatibleBaseUrl(value) {
|
||
return String(value || "")
|
||
.trim()
|
||
.replace(/\/+(chat\/completions|embeddings)$/i, "")
|
||
.replace(/\/+$/, "");
|
||
}
|
||
|
||
function normalizeVector(value) {
|
||
if (!Array.isArray(value)) return null;
|
||
const vector = value.map((item) => Number(item)).filter((item) => Number.isFinite(item));
|
||
return vector.length ? new Float64Array(vector) : null;
|
||
}
|
||
|
||
function readEmbeddingMode(config = {}) {
|
||
return String(config?.embeddingMode || config?.mode || "direct").trim().toLowerCase();
|
||
}
|
||
|
||
function readEmbeddingSource(config = {}) {
|
||
return String(config?.embeddingSource || config?.source || "openai").trim().toLowerCase() || "openai";
|
||
}
|
||
|
||
function buildBackendEmbeddingRequestBody(config = {}, payload = {}) {
|
||
const source = readEmbeddingSource(config);
|
||
const body = {
|
||
source,
|
||
model: String(config?.model || "").trim(),
|
||
isQuery: Boolean(payload.isQuery),
|
||
};
|
||
if (payload.text !== undefined) {
|
||
body.text = String(payload.text ?? "");
|
||
}
|
||
if (Array.isArray(payload.texts)) {
|
||
body.texts = payload.texts.map((item) => String(item ?? ""));
|
||
}
|
||
if (BACKEND_SOURCES_REQUIRING_API_URL.has(source)) {
|
||
body.apiUrl = normalizeOpenAICompatibleBaseUrl(config?.apiUrl);
|
||
}
|
||
if (source === "ollama") {
|
||
body.keep = false;
|
||
}
|
||
return body;
|
||
}
|
||
|
||
async function requestBackendEmbeddings(config = {}, payload = {}, { signal } = {}) {
|
||
const response = await fetchWithTimeout(
|
||
"/api/vector/embed",
|
||
{
|
||
method: "POST",
|
||
headers: {
|
||
...getRequestHeaders(),
|
||
"Content-Type": "application/json",
|
||
},
|
||
signal,
|
||
body: JSON.stringify(buildBackendEmbeddingRequestBody(config, payload)),
|
||
},
|
||
getConfiguredTimeoutMs(config),
|
||
);
|
||
|
||
if (!response.ok) {
|
||
const errorText = await response.text().catch(() => response.statusText);
|
||
console.error(
|
||
`[ST-BME] Backend Embedding API 错误 (${response.status}):`,
|
||
errorText,
|
||
);
|
||
return null;
|
||
}
|
||
|
||
return await response.json().catch(() => ({}));
|
||
}
|
||
|
||
function createCombinedAbortSignal(...signals) {
|
||
const validSignals = signals.filter(Boolean);
|
||
if (validSignals.length <= 1) {
|
||
return validSignals[0] || undefined;
|
||
}
|
||
|
||
if (
|
||
typeof AbortSignal !== "undefined" &&
|
||
typeof AbortSignal.any === "function"
|
||
) {
|
||
return AbortSignal.any(validSignals);
|
||
}
|
||
|
||
const controller = new AbortController();
|
||
for (const signal of validSignals) {
|
||
if (signal.aborted) {
|
||
controller.abort(signal.reason);
|
||
return controller.signal;
|
||
}
|
||
signal.addEventListener("abort", () => controller.abort(signal.reason), {
|
||
once: true,
|
||
});
|
||
}
|
||
return controller.signal;
|
||
}
|
||
|
||
async function fetchWithTimeout(
|
||
url,
|
||
options = {},
|
||
timeoutMs = EMBEDDING_REQUEST_TIMEOUT_MS,
|
||
) {
|
||
const controller = new AbortController();
|
||
const timeout = setTimeout(
|
||
() =>
|
||
controller.abort(
|
||
new DOMException(
|
||
`Embedding 请求超时 (${Math.round(timeoutMs / 1000)}s)`,
|
||
"AbortError",
|
||
),
|
||
),
|
||
timeoutMs,
|
||
);
|
||
const signal = options.signal
|
||
? createCombinedAbortSignal(options.signal, controller.signal)
|
||
: controller.signal;
|
||
|
||
try {
|
||
return await fetch(url, {
|
||
...options,
|
||
signal,
|
||
});
|
||
} finally {
|
||
clearTimeout(timeout);
|
||
}
|
||
}
|
||
|
||
/**
|
||
* 调用外部 Embedding API
|
||
*
|
||
* @param {string} text - 要嵌入的文本
|
||
* @param {object} config - API 配置
|
||
* @param {string} config.apiUrl - API 基地址(如 https://api.openai.com/v1)
|
||
* @param {string} config.apiKey - API Key
|
||
* @param {string} config.model - 模型名(如 text-embedding-3-small)
|
||
* @returns {Promise<Float64Array|null>} 向量或 null
|
||
*/
|
||
export async function embedText(text, config, { signal, isQuery = false } = {}) {
|
||
const override = getEmbeddingTestOverride("embedText");
|
||
if (override) {
|
||
return await override(text, config, { signal, isQuery });
|
||
}
|
||
|
||
if (readEmbeddingMode(config) === "backend") {
|
||
if (!text || !config?.model) {
|
||
console.warn("[ST-BME] Embedding 配置不完整,跳过");
|
||
return null;
|
||
}
|
||
try {
|
||
const payload = await requestBackendEmbeddings(
|
||
config,
|
||
{ text, isQuery },
|
||
{ signal },
|
||
);
|
||
return normalizeVector(payload?.vector);
|
||
} catch (e) {
|
||
if (isAbortError(e)) {
|
||
throw e;
|
||
}
|
||
console.error("[ST-BME] Backend Embedding 调用失败:", e);
|
||
return null;
|
||
}
|
||
}
|
||
|
||
const apiUrl = normalizeOpenAICompatibleBaseUrl(config?.apiUrl);
|
||
if (!text || !apiUrl || !config?.model) {
|
||
console.warn("[ST-BME] Embedding 配置不完整,跳过");
|
||
return null;
|
||
}
|
||
|
||
try {
|
||
const response = await fetchWithTimeout(
|
||
`${apiUrl}/embeddings`,
|
||
{
|
||
method: "POST",
|
||
headers: {
|
||
"Content-Type": "application/json",
|
||
...(config.apiKey
|
||
? { Authorization: `Bearer ${config.apiKey}` }
|
||
: {}),
|
||
},
|
||
signal,
|
||
body: JSON.stringify({
|
||
model: config.model,
|
||
input: text,
|
||
}),
|
||
},
|
||
getConfiguredTimeoutMs(config),
|
||
);
|
||
|
||
if (!response.ok) {
|
||
const errorText = await response.text();
|
||
console.error(
|
||
`[ST-BME] Embedding API 错误 (${response.status}):`,
|
||
errorText,
|
||
);
|
||
return null;
|
||
}
|
||
|
||
const data = await response.json();
|
||
const vector = data?.data?.[0]?.embedding;
|
||
|
||
if (!vector || !Array.isArray(vector)) {
|
||
console.error("[ST-BME] Embedding API 返回格式异常:", data);
|
||
return null;
|
||
}
|
||
|
||
return new Float64Array(vector);
|
||
} catch (e) {
|
||
if (isAbortError(e)) {
|
||
throw e;
|
||
}
|
||
console.error("[ST-BME] Embedding API 调用失败:", e);
|
||
return null;
|
||
}
|
||
}
|
||
|
||
/**
|
||
* 批量嵌入文本
|
||
*
|
||
* @param {string[]} texts
|
||
* @param {object} config
|
||
* @returns {Promise<(Float64Array|null)[]>}
|
||
*/
|
||
export async function embedBatch(texts, config, { signal, isQuery = false } = {}) {
|
||
const override = getEmbeddingTestOverride("embedBatch");
|
||
if (override) {
|
||
return await override(texts, config, { signal, isQuery });
|
||
}
|
||
|
||
if (readEmbeddingMode(config) === "backend") {
|
||
if (!texts.length || !config?.model) {
|
||
return texts.map(() => null);
|
||
}
|
||
try {
|
||
const payload = await requestBackendEmbeddings(
|
||
config,
|
||
{ texts, isQuery },
|
||
{ signal },
|
||
);
|
||
const vectors = Array.isArray(payload?.vectors) ? payload.vectors : [];
|
||
return texts.map((_, index) => normalizeVector(vectors[index]));
|
||
} catch (e) {
|
||
if (isAbortError(e)) {
|
||
throw e;
|
||
}
|
||
console.error("[ST-BME] Backend Embedding 批量调用失败:", e);
|
||
return texts.map(() => null);
|
||
}
|
||
}
|
||
|
||
const apiUrl = normalizeOpenAICompatibleBaseUrl(config?.apiUrl);
|
||
if (!texts.length || !apiUrl || !config?.model) {
|
||
return texts.map(() => null);
|
||
}
|
||
|
||
try {
|
||
const response = await fetchWithTimeout(
|
||
`${apiUrl}/embeddings`,
|
||
{
|
||
method: "POST",
|
||
headers: {
|
||
"Content-Type": "application/json",
|
||
...(config.apiKey
|
||
? { Authorization: `Bearer ${config.apiKey}` }
|
||
: {}),
|
||
},
|
||
signal,
|
||
body: JSON.stringify({
|
||
model: config.model,
|
||
input: texts,
|
||
}),
|
||
},
|
||
getConfiguredTimeoutMs(config),
|
||
);
|
||
|
||
if (!response.ok) {
|
||
const errorText = await response.text();
|
||
console.error(
|
||
`[ST-BME] Embedding API 批量错误 (${response.status}):`,
|
||
errorText,
|
||
);
|
||
return texts.map(() => null);
|
||
}
|
||
|
||
const data = await response.json();
|
||
const embeddings = data?.data;
|
||
|
||
if (!Array.isArray(embeddings)) {
|
||
return texts.map(() => null);
|
||
}
|
||
|
||
// 按 index 排序(API 可能不保证顺序)
|
||
embeddings.sort((a, b) => a.index - b.index);
|
||
|
||
return embeddings.map((item) => {
|
||
if (item?.embedding && Array.isArray(item.embedding)) {
|
||
return new Float64Array(item.embedding);
|
||
}
|
||
return null;
|
||
});
|
||
} catch (e) {
|
||
if (isAbortError(e)) {
|
||
throw e;
|
||
}
|
||
console.error("[ST-BME] Embedding API 批量调用失败:", e);
|
||
return texts.map(() => null);
|
||
}
|
||
}
|
||
|
||
/**
|
||
* 计算两个向量的 cosine 相似度
|
||
*
|
||
* @param {Float64Array|number[]} vecA
|
||
* @param {Float64Array|number[]} vecB
|
||
* @returns {number} 相似度 [-1, 1]
|
||
*/
|
||
export function cosineSimilarity(vecA, vecB) {
|
||
if (!vecA || !vecB || vecA.length !== vecB.length || vecA.length === 0) {
|
||
return 0;
|
||
}
|
||
|
||
let dotProduct = 0;
|
||
let normA = 0;
|
||
let normB = 0;
|
||
|
||
for (let i = 0; i < vecA.length; i++) {
|
||
dotProduct += vecA[i] * vecB[i];
|
||
normA += vecA[i] * vecA[i];
|
||
normB += vecB[i] * vecB[i];
|
||
}
|
||
|
||
const denominator = Math.sqrt(normA) * Math.sqrt(normB);
|
||
if (denominator === 0) return 0;
|
||
|
||
return dotProduct / denominator;
|
||
}
|
||
|
||
/**
|
||
* 暴力搜索:找出与查询向量最相似的 Top-K 节点
|
||
* PeroCore 的向量引擎也是暴力搜索(<1000 节点时比 HNSW 更快)
|
||
*
|
||
* @param {Float64Array|number[]} queryVec - 查询向量
|
||
* @param {Array<{nodeId: string, embedding: Float64Array|number[]}>} candidates - 候选节点
|
||
* @param {number} topK - 返回数量
|
||
* @returns {Array<{nodeId: string, score: number}>} 按相似度降序
|
||
*/
|
||
export function searchSimilar(queryVec, candidates, topK = 20) {
|
||
const override = getEmbeddingTestOverride("searchSimilar");
|
||
if (override) {
|
||
return override(queryVec, candidates, topK);
|
||
}
|
||
|
||
if (!queryVec || candidates.length === 0) return [];
|
||
|
||
const scored = candidates
|
||
.filter((c) => c.embedding && c.embedding.length > 0)
|
||
.map((c) => ({
|
||
nodeId: c.nodeId,
|
||
score: cosineSimilarity(queryVec, c.embedding),
|
||
}))
|
||
.filter((item) => item.score > 0);
|
||
|
||
scored.sort((a, b) => b.score - a.score);
|
||
|
||
return scored.slice(0, topK);
|
||
}
|
||
|
||
/**
|
||
* 测试 Embedding API 连通性
|
||
*
|
||
* @param {object} config - API 配置
|
||
* @returns {Promise<{success: boolean, dimensions: number, error: string}>}
|
||
*/
|
||
export async function testConnection(config) {
|
||
try {
|
||
const vec = await embedText("test connection", config);
|
||
if (vec) {
|
||
return { success: true, dimensions: vec.length, error: "" };
|
||
}
|
||
return { success: false, dimensions: 0, error: "API 返回空结果" };
|
||
} catch (e) {
|
||
return { success: false, dimensions: 0, error: String(e) };
|
||
}
|
||
}
|