LibreChat/packages/api/src/endpoints/custom/initialize.ts

315 lines
11 KiB
TypeScript

import { Providers } from '@librechat/agents';
import {
ErrorTypes,
envVarRegex,
EModelEndpoint,
FetchTokenConfig,
extractEnvVariable,
} from 'librechat-data-provider';
import type { TEndpoint } from 'librechat-data-provider';
import type { AppConfig } from '@librechat/data-schemas';
import type {
BaseInitializeParams,
InitializeResultBase,
EndpointTokenConfig,
AnthropicModelOptions,
} from '~/types';
import { getLLMConfig as getAnthropicLLMConfig } from '~/endpoints/anthropic/llm';
import { extractDefaultParams } from '~/endpoints/openai/llm';
import { isUserProvided, checkUserKeyExpiry } from '~/utils';
import { getOpenAIConfig } from '~/endpoints/openai/config';
import { getCustomEndpointConfig } from '~/app/config';
import { fetchModels } from '~/endpoints/models';
import { validateEndpointURL } from '~/auth';
import { tokenConfigCache } from '~/cache';
const { PROXY } = process.env;
/**
* Cache key for an endpoint's fetched token config. User-scoped when the
* model fetch can resolve per-user: user-provided key/URL, or header
* templates forwarded against an admin-trusted base URL — making the
* response, and therefore the derived token config, user-specific.
*/
export function getTokenConfigKey(
endpointConfig: Partial<TEndpoint>,
endpoint: string,
userId: string,
): string {
const hasTokenConfig = endpointConfig.tokenConfig != null;
const userProvidesKey = isUserProvided(extractEnvVariable(endpointConfig.apiKey ?? ''));
const userProvidesURL = isUserProvided(extractEnvVariable(endpointConfig.baseURL ?? ''));
const willForwardUserScopedHeaders = !!endpointConfig?.headers && !userProvidesURL;
return !hasTokenConfig && (userProvidesKey || userProvidesURL || willForwardUserScopedHeaders)
? `${endpoint}:${userId}`
: endpoint;
}
/**
* Maps an admin-facing static `tokenConfig` to the billing shape: the UI uses
* `cacheWrite`/`cacheRead`, but `getCacheMultiplier` indexes `write`/`read`.
* Adds those keys (preserving the originals) so cache tokens bill at the
* configured rate instead of the prompt-rate fallback.
*/
function toBillingTokenConfig(
tokenConfig: Record<string, Record<string, number>>,
): EndpointTokenConfig {
const result: EndpointTokenConfig = {};
for (const [model, rates] of Object.entries(tokenConfig)) {
const mapped = { ...rates } as Record<string, number>;
if (rates.cacheWrite != null) {
mapped.write = rates.cacheWrite;
}
if (rates.cacheRead != null) {
mapped.read = rates.cacheRead;
}
result[model] = mapped as EndpointTokenConfig[string];
}
return result;
}
/**
* Builds custom options from endpoint configuration
*/
function buildCustomOptions(
endpointConfig: Partial<TEndpoint>,
appConfig?: AppConfig,
endpointTokenConfig?: Record<string, unknown>,
) {
const customOptions: Record<string, unknown> = {
headers: endpointConfig.headers,
addParams: endpointConfig.addParams,
dropParams: endpointConfig.dropParams,
customParams: endpointConfig.customParams,
titleConvo: endpointConfig.titleConvo,
titleModel: endpointConfig.titleModel,
modelDisplayLabel: endpointConfig.modelDisplayLabel,
titleMethod: endpointConfig.titleMethod ?? 'completion',
directEndpoint: endpointConfig.directEndpoint,
titleMessageRole: endpointConfig.titleMessageRole,
streamRate: endpointConfig.streamRate,
endpointTokenConfig,
};
const allConfig = appConfig?.endpoints?.all;
if (allConfig) {
customOptions.streamRate = allConfig.streamRate;
}
return customOptions;
}
/**
* Builds a native Anthropic (`/v1/messages`) config for a custom endpoint that
* declares `provider: anthropic`, pointing the Anthropic client at the custom
* `baseURL`/`apiKey`. Returns `provider: anthropic` so the agent uses the native
* Anthropic client instead of the OpenAI-compatible one. Headers stay unresolved
* here and resolve at request time via `resolveConfigHeaders`.
*/
function buildAnthropicCustomConfig({
apiKey,
baseURL,
modelOptions,
endpointConfig,
userProvidesURL,
}: {
apiKey: string;
baseURL: string;
modelOptions: AnthropicModelOptions;
endpointConfig: Partial<TEndpoint>;
userProvidesURL: boolean;
}): InitializeResultBase {
const result = getAnthropicLLMConfig(apiKey, {
modelOptions,
proxy: PROXY ?? undefined,
reverseProxyUrl: baseURL,
headers: userProvidesURL ? undefined : endpointConfig.headers,
addParams: endpointConfig.addParams,
dropParams: endpointConfig.dropParams,
/** Apply admin `customParams.paramDefinitions` defaults (e.g. promptCache,
* web_search, thinking) the OpenAI-compatible path gets via `getOpenAIConfig`. */
defaultParams: extractDefaultParams(endpointConfig.customParams?.paramDefinitions),
});
return {
llmConfig: result.llmConfig as InitializeResultBase['llmConfig'],
tools: result.tools,
provider: Providers.ANTHROPIC,
};
}
/**
* Initializes a custom endpoint client configuration.
* This function handles custom endpoints defined in librechat.yaml, including
* user-provided API keys and URLs.
*
* @param params - Configuration parameters
* @returns Promise resolving to endpoint configuration options
* @throws Error if config is missing, API key is not provided, or base URL is missing
*/
export async function initializeCustom({
req,
endpoint,
model_parameters,
db,
}: BaseInitializeParams): Promise<InitializeResultBase> {
const appConfig = req.config;
const { key: expiresAt } = req.body;
const endpointConfig = getCustomEndpointConfig({
endpoint,
appConfig,
});
if (!endpointConfig) {
throw new Error(`Config not found for the ${endpoint} custom endpoint.`);
}
const CUSTOM_API_KEY = extractEnvVariable(endpointConfig.apiKey ?? '');
const CUSTOM_BASE_URL = extractEnvVariable(endpointConfig.baseURL ?? '');
if (CUSTOM_API_KEY.match(envVarRegex)) {
throw new Error(`Missing API Key for ${endpoint}.`);
}
if (CUSTOM_BASE_URL.match(envVarRegex)) {
throw new Error(`Missing Base URL for ${endpoint}.`);
}
const userProvidesKey = isUserProvided(CUSTOM_API_KEY);
const userProvidesURL = isUserProvided(CUSTOM_BASE_URL);
// Expiry is only checked when present: the Agents API sends an OpenAI-compatible
// request body that does not include `key` (the expiry timestamp), so expiresAt
// will be undefined in that flow. The key is still fetched regardless.
if (expiresAt && (userProvidesKey || userProvidesURL)) {
checkUserKeyExpiry(expiresAt, endpoint);
}
let userValues = null;
if (userProvidesKey || userProvidesURL) {
userValues = await db.getUserKeyValues({ userId: req.user?.id ?? '', name: endpoint });
}
const apiKey = userProvidesKey ? userValues?.apiKey : CUSTOM_API_KEY;
const baseURL = userProvidesURL ? userValues?.baseURL : CUSTOM_BASE_URL;
if (userProvidesKey && !apiKey) {
throw new Error(
JSON.stringify({
type: ErrorTypes.NO_USER_KEY,
}),
);
}
if (userProvidesURL && !baseURL) {
throw new Error(
JSON.stringify({
type: ErrorTypes.NO_BASE_URL,
}),
);
}
if (!apiKey) {
throw new Error(`${endpoint} API key not provided.`);
}
if (!baseURL) {
throw new Error(`${endpoint} Base URL not provided.`);
}
if (userProvidesURL) {
await validateEndpointURL(baseURL, endpoint, appConfig?.endpoints?.allowedAddresses);
}
let endpointTokenConfig: EndpointTokenConfig | undefined;
const userId = req.user?.id ?? '';
const cache = tokenConfigCache();
const hasTokenConfig = endpointConfig.tokenConfig != null;
const tokenKey = getTokenConfigKey(endpointConfig, endpoint, userId);
if (hasTokenConfig) {
/** A static override is authoritative — use it for the agent's billing
* and balance checks, not just the advertised UI token config. Mirror
* the admin-facing `cacheWrite`/`cacheRead` keys onto the `write`/`read`
* keys the billing multiplier reads. */
endpointTokenConfig = toBillingTokenConfig(
endpointConfig.tokenConfig as Record<string, Record<string, number>>,
);
} else {
const cachedConfig =
FetchTokenConfig[endpoint.toLowerCase() as keyof typeof FetchTokenConfig] &&
(await cache.get(tokenKey));
endpointTokenConfig = (cachedConfig as EndpointTokenConfig) || undefined;
}
if (
FetchTokenConfig[endpoint.toLowerCase() as keyof typeof FetchTokenConfig] &&
endpointConfig &&
endpointConfig.models?.fetch &&
!endpointTokenConfig
) {
await fetchModels({
apiKey,
baseURL,
name: endpoint,
user: userId,
tokenKey,
userObject: req.user,
// Mirror the security guard in `loadConfigModels`: never forward
// header overrides when the base URL is user-supplied — configured
// templates like {{LIBRECHAT_OPENID_ID_TOKEN}} would otherwise resolve
// and leak the user's identity token to a destination the user controls.
headers: userProvidesURL ? undefined : endpointConfig.headers,
// Note: when both `headers` and `userObject` are supplied below, the
// MODEL_QUERIES cache inside `fetchModels` is automatically skipped,
// which prevents a per-user filtered model list from leaking across
// users. The token-config cache key (`tokenKey`) is also user-scoped
// above when these headers will be forwarded.
});
endpointTokenConfig = (await cache.get(tokenKey)) as EndpointTokenConfig | undefined;
}
const customOptions = buildCustomOptions(endpointConfig, appConfig, endpointTokenConfig);
const clientOptions: Record<string, unknown> = {
reverseProxyUrl: baseURL ?? null,
proxy: PROXY ?? null,
...customOptions,
};
const modelOptions = { ...(model_parameters ?? {}), user: userId };
let options: InitializeResultBase;
if (endpointConfig.provider === EModelEndpoint.anthropic) {
/** Native Anthropic `/v1/messages` client against the custom baseURL/apiKey.
* `useLegacyContent` is intentionally left unset (matches the built-in
* Anthropic endpoint, which uses native content formatting). */
options = buildAnthropicCustomConfig({
apiKey,
baseURL,
modelOptions: modelOptions as AnthropicModelOptions,
endpointConfig,
userProvidesURL,
});
options.endpointTokenConfig = endpointTokenConfig;
} else {
const finalClientOptions = {
modelOptions,
...clientOptions,
};
options = getOpenAIConfig(apiKey, finalClientOptions, endpoint);
if (options != null) {
options.useLegacyContent = true;
options.endpointTokenConfig = endpointTokenConfig;
}
}
const streamRate = clientOptions.streamRate as number | undefined;
if (streamRate) {
(options.llmConfig as Record<string, unknown>)._lc_stream_delay = streamRate;
}
return options;
}