chat-ui

Sleeping

App Files Files Community

Galén

nsarrazin committed on Dec 5, 2023

Commit

a1afcb6

unverified ·

1 Parent(s): 2da78f5

Add support for passing an API key or any other custom token in the authorization header (#579)

Browse files

* Add support for passing an API key or any other custom token in the authorization header

* Make linter happy

* Fix README as per linter suggestions

* Refactor endpoints to actually parse zod config

* Remove top level env var and simplify header addition

* Skip section on API key or other, remove obsolete comment in endpointTgi.ts and remove CUSTOM_AUTHORIZATION_TOKEN from .env

---------

Co-authored-by: Nathan Sarrazin <[email protected]>

Files changed (6) hide show

README.md +2 -0
src/lib/server/endpoints/aws/endpointAws.ts +6 -9
src/lib/server/endpoints/llamacpp/endpointLlamacpp.ts +4 -4
src/lib/server/endpoints/ollama/endpointOllama.ts +3 -5
src/lib/server/endpoints/openai/endpointOai.ts +4 -6
src/lib/server/endpoints/tgi/endpointTgi.ts +16 -6

README.md CHANGED Viewed

@@ -397,6 +397,8 @@ You can then add the generated information and the `authorization` parameter to
 ]
 ```
 #### Models hosted on multiple custom endpoints
 If the model being hosted will be available on multiple servers/instances add the `weight` parameter to your `.env.local`. The `weight` will be used to determine the probability of requesting a particular endpoint.

 ]
 ```
+Please note that if `HF_ACCESS_TOKEN` is also set and not empty, it will take precedence over the `authorization` parameter.
 #### Models hosted on multiple custom endpoints
 If the model being hosted will be available on multiple servers/instances add the `weight` parameter to your `.env.local`. The `weight` will be used to determine the probability of requesting a particular endpoint.

src/lib/server/endpoints/aws/endpointAws.ts CHANGED Viewed

@@ -15,15 +15,9 @@ export const endpointAwsParametersSchema = z.object({
 	region: z.string().optional(),
 });
-export async function endpointAws({
-	url,
-	accessKey,
-	secretKey,
-	sessionToken,
-	model,
-	region,
-	service,
-}: z.infer<typeof endpointAwsParametersSchema>): Promise<Endpoint> {
 	let AwsClient;
 	try {
 		AwsClient = (await import("aws4fetch")).AwsClient;
@@ -31,6 +25,9 @@ export async function endpointAws({
 		throw new Error("Failed to import aws4fetch");
 	}
 	const aws = new AwsClient({
 		accessKeyId: accessKey,
 		secretAccessKey: secretKey,

 	region: z.string().optional(),
 });
+export async function endpointAws(
+	input: z.input<typeof endpointAwsParametersSchema>
+): Promise<Endpoint> {
 	let AwsClient;
 	try {
 		AwsClient = (await import("aws4fetch")).AwsClient;
 		throw new Error("Failed to import aws4fetch");
 	}
+	const { url, accessKey, secretKey, sessionToken, model, region, service } =
+		endpointAwsParametersSchema.parse(input);
 	const aws = new AwsClient({
 		accessKeyId: accessKey,
 		secretAccessKey: secretKey,

src/lib/server/endpoints/llamacpp/endpointLlamacpp.ts CHANGED Viewed

@@ -12,10 +12,10 @@ export const endpointLlamacppParametersSchema = z.object({
 	accessToken: z.string().min(1).default(HF_ACCESS_TOKEN),
 });
-export function endpointLlamacpp({
-	url,
-	model,
-}: z.infer<typeof endpointLlamacppParametersSchema>): Endpoint {
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,

 	accessToken: z.string().min(1).default(HF_ACCESS_TOKEN),
 });
+export function endpointLlamacpp(
+	input: z.input<typeof endpointLlamacppParametersSchema>
+): Endpoint {
+	const { url, model } = endpointLlamacppParametersSchema.parse(input);
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,

src/lib/server/endpoints/ollama/endpointOllama.ts CHANGED Viewed

@@ -11,11 +11,9 @@ export const endpointOllamaParametersSchema = z.object({
 	ollamaName: z.string().min(1).optional(),
 });
-export function endpointOllama({
-	url,
-	model,
-	ollamaName,
-}: z.infer<typeof endpointOllamaParametersSchema>): Endpoint {
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,

 	ollamaName: z.string().min(1).optional(),
 });
+export function endpointOllama(input: z.input<typeof endpointOllamaParametersSchema>): Endpoint {
+	const { url, model, ollamaName } = endpointOllamaParametersSchema.parse(input);
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,

src/lib/server/endpoints/openai/endpointOai.ts CHANGED Viewed

@@ -16,12 +16,10 @@ export const endpointOAIParametersSchema = z.object({
 		.default("chat_completions"),
 });
-export async function endpointOai({
-	baseURL,
-	apiKey,
-	completion,
-	model,
-}: z.infer<typeof endpointOAIParametersSchema>): Promise<Endpoint> {
 	let OpenAI;
 	try {
 		OpenAI = (await import("openai")).OpenAI;

 		.default("chat_completions"),
 });
+export async function endpointOai(
+	input: z.input<typeof endpointOAIParametersSchema>
+): Promise<Endpoint> {
+	const { baseURL, apiKey, completion, model } = endpointOAIParametersSchema.parse(input);
 	let OpenAI;
 	try {
 		OpenAI = (await import("openai")).OpenAI;

src/lib/server/endpoints/tgi/endpointTgi.ts CHANGED Viewed

@@ -10,13 +10,11 @@ export const endpointTgiParametersSchema = z.object({
 	type: z.literal("tgi"),
 	url: z.string().url(),
 	accessToken: z.string().default(HF_ACCESS_TOKEN),
 });
-export function endpointTgi({
-	url,
-	accessToken,
-	model,
-}: z.infer<typeof endpointTgiParametersSchema>): Endpoint {
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,
@@ -33,7 +31,19 @@ export function endpointTgi({
 				inputs: prompt,
 				accessToken,
 			},
-			{ use_cache: false }
 		);
 	};
 }

 	type: z.literal("tgi"),
 	url: z.string().url(),
 	accessToken: z.string().default(HF_ACCESS_TOKEN),
+	authorization: z.string().optional(),
 });
+export function endpointTgi(input: z.input<typeof endpointTgiParametersSchema>): Endpoint {
+	const { url, accessToken, model, authorization } = endpointTgiParametersSchema.parse(input);
 	return async ({ conversation }) => {
 		const prompt = await buildPrompt({
 			messages: conversation.messages,
 				inputs: prompt,
 				accessToken,
 			},
+			{
+				use_cache: false,
+				fetch: async (endpointUrl, info) => {
+					if (info && authorization && !accessToken) {
+						// Set authorization header if it is defined and HF_ACCESS_TOKEN is empty
+						info.headers = {
+							...info.headers,
+							Authorization: authorization,
+						};
+					}
+					return fetch(endpointUrl, info);
+				},
+			}
 		);
 	};
 }