mirror of
https://github.com/danny-avila/LibreChat.git
synced 2026-06-21 04:31:57 +00:00
- live/completed gauge counts the repaired completion (normalized output), so under-reporting providers don't drop the response from used context - translate static tokenConfig cacheWrite/cacheRead onto the write/read keys getCacheMultiplier reads, so cache tokens bill at the configured rate instead of the prompt-rate fallback - clear the token index and usage atoms when leaving a conversation, so visited histories don't accumulate in memory for the tab's lifetime - wait for startupConfig before mounting the gauge, so a deployment with contextUsage disabled never briefly mounts it or fires the token-config query on first load
253 lines
8.5 KiB
TypeScript
253 lines
8.5 KiB
TypeScript
import {
|
|
ErrorTypes,
|
|
envVarRegex,
|
|
FetchTokenConfig,
|
|
extractEnvVariable,
|
|
} from 'librechat-data-provider';
|
|
import type { TEndpoint } from 'librechat-data-provider';
|
|
import type { AppConfig } from '@librechat/data-schemas';
|
|
import type { BaseInitializeParams, InitializeResultBase, EndpointTokenConfig } from '~/types';
|
|
import { isUserProvided, checkUserKeyExpiry } from '~/utils';
|
|
import { getOpenAIConfig } from '~/endpoints/openai/config';
|
|
import { getCustomEndpointConfig } from '~/app/config';
|
|
import { fetchModels } from '~/endpoints/models';
|
|
import { validateEndpointURL } from '~/auth';
|
|
import { tokenConfigCache } from '~/cache';
|
|
|
|
/** Outbound proxy URL read from the `PROXY` environment variable; `undefined` when unset. */
const PROXY = process.env.PROXY;
|
|
|
|
/**
 * Derives the cache key under which an endpoint's fetched token config is stored.
 *
 * The key is user-scoped (`<endpoint>:<userId>`) when no static `tokenConfig`
 * is configured and at least one of the following holds:
 * - the API key is user-provided,
 * - the base URL is user-provided,
 * - headers are configured and the base URL is not user-provided (header
 *   templates may then be forwarded and can resolve per user).
 *
 * In every other case the bare endpoint name is returned.
 *
 * @param endpointConfig - Custom endpoint configuration.
 * @param endpoint - Endpoint name.
 * @param userId - ID of the requesting user.
 * @returns The token-config cache key.
 */
export function getTokenConfigKey(
  endpointConfig: Partial<TEndpoint>,
  endpoint: string,
  userId: string,
): string {
  const keyFromUser = isUserProvided(extractEnvVariable(endpointConfig.apiKey ?? ''));
  const urlFromUser = isUserProvided(extractEnvVariable(endpointConfig.baseURL ?? ''));
  const forwardsHeaders = Boolean(endpointConfig.headers) && !urlFromUser;

  // A static token config is never user-specific, so it always maps to the shared key.
  if (endpointConfig.tokenConfig != null) {
    return endpoint;
  }

  const isUserScoped = keyFromUser || urlFromUser || forwardsHeaders;
  if (isUserScoped) {
    return `${endpoint}:${userId}`;
  }
  return endpoint;
}
|
|
|
|
/**
 * Converts an admin-facing static `tokenConfig` into the shape used for billing.
 *
 * The admin-facing config names cache rates `cacheWrite`/`cacheRead`, while
 * `getCacheMultiplier` indexes `write`/`read`. Each model's rates are copied
 * and, where `cacheWrite`/`cacheRead` are set, mirrored onto `write`/`read`.
 * The original keys are kept and the input object is not mutated.
 *
 * @param tokenConfig - Per-model rate tables keyed by model name.
 * @returns A new per-model rate table with `write`/`read` added where applicable.
 */
function toBillingTokenConfig(
  tokenConfig: Record<string, Record<string, number>>,
): EndpointTokenConfig {
  const billing: EndpointTokenConfig = {};

  Object.entries(tokenConfig).forEach(([modelName, configuredRates]) => {
    const billingRates: Record<string, number> = { ...configuredRates };
    const { cacheWrite, cacheRead } = configuredRates;

    if (cacheWrite != null) {
      billingRates.write = cacheWrite;
    }
    if (cacheRead != null) {
      billingRates.read = cacheRead;
    }

    billing[modelName] = billingRates as EndpointTokenConfig[string];
  });

  return billing;
}
|
|
|
|
/**
 * Builds the custom client options for an endpoint from its configuration.
 *
 * Copies the endpoint-level settings (headers, param overrides, title options,
 * stream rate, ...) into a plain options object and attaches the resolved
 * token config. `titleMethod` defaults to `'completion'` when not configured.
 *
 * A `streamRate` configured under `appConfig.endpoints.all` takes precedence
 * over the endpoint's own value. When the shared config does not set a
 * `streamRate`, the endpoint's own value is kept instead of being overwritten
 * with `undefined`.
 *
 * @param endpointConfig - Custom endpoint configuration.
 * @param appConfig - Application config; only `endpoints.all.streamRate` is read.
 * @param endpointTokenConfig - Resolved token config to attach to the options.
 * @returns The assembled custom options.
 */
function buildCustomOptions(
  endpointConfig: Partial<TEndpoint>,
  appConfig?: AppConfig,
  endpointTokenConfig?: Record<string, unknown>,
) {
  const customOptions: Record<string, unknown> = {
    headers: endpointConfig.headers,
    addParams: endpointConfig.addParams,
    dropParams: endpointConfig.dropParams,
    customParams: endpointConfig.customParams,
    titleConvo: endpointConfig.titleConvo,
    titleModel: endpointConfig.titleModel,
    modelDisplayLabel: endpointConfig.modelDisplayLabel,
    titleMethod: endpointConfig.titleMethod ?? 'completion',
    directEndpoint: endpointConfig.directEndpoint,
    titleMessageRole: endpointConfig.titleMessageRole,
    streamRate: endpointConfig.streamRate,
    endpointTokenConfig,
  };

  // Only override when the shared config actually sets a rate; an `all` block
  // without `streamRate` must not erase the endpoint-specific setting.
  const sharedStreamRate = appConfig?.endpoints?.all?.streamRate;
  if (sharedStreamRate != null) {
    customOptions.streamRate = sharedStreamRate;
  }

  return customOptions;
}
|
|
|
|
/**
 * Initializes the client configuration for a custom endpoint.
 *
 * Steps, in order:
 * 1. Look up the endpoint's config and resolve `apiKey`/`baseURL` through
 *    `extractEnvVariable`; a value still matching `envVarRegex` is rejected.
 * 2. When the key and/or URL is user-provided, check key expiry (only if the
 *    request carries one) and load the user's stored values.
 * 3. Validate a user-provided base URL against the allowed addresses.
 * 4. Resolve the token config: a static `tokenConfig` wins; otherwise a cached
 *    value is used, and models are fetched to populate the cache when the
 *    endpoint supports it and `models.fetch` is enabled.
 * 5. Assemble the client options and pass them to `getOpenAIConfig`.
 *
 * @param params - Configuration parameters
 * @returns Promise resolving to endpoint configuration options
 * @throws Error if config is missing, API key is not provided, or base URL is missing
 */
export async function initializeCustom({
  req,
  endpoint,
  model_parameters,
  db,
}: BaseInitializeParams): Promise<InitializeResultBase> {
  const appConfig = req.config;
  const expiresAt = req.body.key;

  const endpointConfig = getCustomEndpointConfig({ endpoint, appConfig });
  if (!endpointConfig) {
    throw new Error(`Config not found for the ${endpoint} custom endpoint.`);
  }

  const configuredApiKey = extractEnvVariable(endpointConfig.apiKey ?? '');
  const configuredBaseURL = extractEnvVariable(endpointConfig.baseURL ?? '');

  // A value that still matches the env-var pattern after extraction is treated as missing.
  if (configuredApiKey.match(envVarRegex)) {
    throw new Error(`Missing API Key for ${endpoint}.`);
  }
  if (configuredBaseURL.match(envVarRegex)) {
    throw new Error(`Missing Base URL for ${endpoint}.`);
  }

  const userProvidesKey = isUserProvided(configuredApiKey);
  const userProvidesURL = isUserProvided(configuredBaseURL);
  const needsUserValues = userProvidesKey || userProvidesURL;

  // The expiry check is conditional on the request carrying one: the Agents API
  // sends an OpenAI-compatible body without `key` (the expiry timestamp), so
  // `expiresAt` is undefined in that flow. The stored values are loaded either way.
  if (needsUserValues && expiresAt) {
    checkUserKeyExpiry(expiresAt, endpoint);
  }

  const userValues = needsUserValues
    ? await db.getUserKeyValues({ userId: req.user?.id ?? '', name: endpoint })
    : null;

  const apiKey = userProvidesKey ? userValues?.apiKey : configuredApiKey;
  const baseURL = userProvidesURL ? userValues?.baseURL : configuredBaseURL;

  // User-provided values that are absent raise typed errors; these checks run
  // before the generic "not provided" checks below.
  if (userProvidesKey && !apiKey) {
    throw new Error(JSON.stringify({ type: ErrorTypes.NO_USER_KEY }));
  }
  if (userProvidesURL && !baseURL) {
    throw new Error(JSON.stringify({ type: ErrorTypes.NO_BASE_URL }));
  }
  if (!apiKey) {
    throw new Error(`${endpoint} API key not provided.`);
  }
  if (!baseURL) {
    throw new Error(`${endpoint} Base URL not provided.`);
  }

  if (userProvidesURL) {
    await validateEndpointURL(baseURL, endpoint, appConfig?.endpoints?.allowedAddresses);
  }

  const userId = req.user?.id ?? '';
  const cache = tokenConfigCache();
  const tokenKey = getTokenConfigKey(endpointConfig, endpoint, userId);
  const supportsTokenConfigFetch =
    FetchTokenConfig[endpoint.toLowerCase() as keyof typeof FetchTokenConfig];

  let endpointTokenConfig: EndpointTokenConfig | undefined;
  if (endpointConfig.tokenConfig != null) {
    /** A static override is authoritative — it is used for the agent's billing
     * and balance checks, not just the advertised UI token config. The
     * admin-facing `cacheWrite`/`cacheRead` keys are mirrored onto the
     * `write`/`read` keys the billing multiplier reads. */
    endpointTokenConfig = toBillingTokenConfig(
      endpointConfig.tokenConfig as Record<string, Record<string, number>>,
    );
  } else if (supportsTokenConfigFetch) {
    endpointTokenConfig = ((await cache.get(tokenKey)) as EndpointTokenConfig) || undefined;
  }

  const shouldFetchModels =
    supportsTokenConfigFetch && endpointConfig.models?.fetch && !endpointTokenConfig;

  if (shouldFetchModels) {
    await fetchModels({
      apiKey,
      baseURL,
      name: endpoint,
      user: userId,
      tokenKey,
      userObject: req.user,
      // Same security guard as `loadConfigModels`: header overrides are never
      // forwarded when the base URL is user-supplied. Configured templates such
      // as {{LIBRECHAT_OPENID_ID_TOKEN}} would otherwise resolve and leak the
      // user's identity token to a destination the user controls.
      headers: userProvidesURL ? undefined : endpointConfig.headers,
      // Note: when both `headers` and `userObject` are supplied, the
      // MODEL_QUERIES cache inside `fetchModels` is skipped, which keeps a
      // per-user filtered model list from leaking across users. The
      // token-config cache key (`tokenKey`) is likewise user-scoped when these
      // headers will be forwarded.
    });
    // Re-read the cache under the same key that was passed to `fetchModels`.
    endpointTokenConfig = (await cache.get(tokenKey)) as EndpointTokenConfig | undefined;
  }

  const clientOptions: Record<string, unknown> = {
    reverseProxyUrl: baseURL ?? null,
    proxy: PROXY ?? null,
    ...buildCustomOptions(endpointConfig, appConfig, endpointTokenConfig),
  };

  const finalClientOptions = {
    modelOptions: { ...(model_parameters ?? {}), user: userId },
    ...clientOptions,
  };

  const options = getOpenAIConfig(apiKey, finalClientOptions, endpoint);
  if (options != null) {
    const initialized = options as InitializeResultBase;
    initialized.useLegacyContent = true;
    initialized.endpointTokenConfig = endpointTokenConfig;
  }

  // A truthy stream rate is copied onto the LLM config as `_lc_stream_delay`.
  const streamRate = clientOptions.streamRate as number | undefined;
  if (streamRate) {
    (options.llmConfig as Record<string, unknown>)._lc_stream_delay = streamRate;
  }

  return options;
}
|