Move Google GenAI API key to env file instead (#1448)
- Updated the documentation with the latest links from Google AI Studio
- Fixed the incorrect documentation on `safetyThreshold`
- Fixed `safetySettings` to exclude the unspecified category, as it is not considered a valid input category in Google's API
Co-authored-by: Nathan Sarrazin <[email protected]>
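To illustrate the `safetySettings` fix described above: the valid input categories can be derived from the SDK's `HarmCategory` enum while skipping `HARM_CATEGORY_UNSPECIFIED`. A minimal TypeScript sketch of that idea (not the exact code from this commit; the helper name is made up):

```ts
import { HarmBlockThreshold, HarmCategory } from "@google/generative-ai";
import type { SafetySetting } from "@google/generative-ai";

// Build one SafetySetting per harm category, skipping HARM_CATEGORY_UNSPECIFIED,
// which the Gemini API rejects as an input category.
function buildSafetySettings(threshold: HarmBlockThreshold): SafetySetting[] {
  return Object.values(HarmCategory)
    .filter((category) => category !== HarmCategory.HARM_CATEGORY_UNSPECIFIED)
    .map((category) => ({ category, threshold }));
}

// For example, block medium-and-above content in every valid category.
const safetySettings = buildSafetySettings(HarmBlockThreshold.BLOCK_MEDIUM_AND_ABOVE);
console.log(safetySettings.map((s) => s.category));
```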
.env CHANGED

@@ -16,6 +16,7 @@ ANTHROPIC_API_KEY=#your anthropic api key here
 CLOUDFLARE_ACCOUNT_ID=#your cloudflare account id here
 CLOUDFLARE_API_TOKEN=#your cloudflare api token here
 COHERE_API_TOKEN=#your cohere api token here
+GOOGLE_GENAI_API_KEY=#your google genai api token here
 
 HF_ACCESS_TOKEN=#LEGACY! Use HF_TOKEN instead
 
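With the variable in place, the endpoint schema can fall back to it whenever a model's endpoint config omits `apiKey`. A trimmed-down sketch of that pattern (hypothetical schema name, using plain `process.env` instead of SvelteKit's `$env/dynamic/private`):

```ts
import { z } from "zod";

// Hypothetical, reduced endpoint schema: if "apiKey" is missing from the
// config, zod substitutes the value of GOOGLE_GENAI_API_KEY.
const genAIParamsSketch = z.object({
  type: z.literal("genai"),
  apiKey: z.string().default(process.env.GOOGLE_GENAI_API_KEY ?? ""),
  safetyThreshold: z.string().optional(),
});

// An endpoint entry without an explicit key resolves to the environment value.
const params = genAIParamsSketch.parse({ type: "genai" });
console.log(params.apiKey ? "API key resolved from environment" : "no API key configured");
```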
docs/source/configuration/models/providers/google.md CHANGED

@@ -52,7 +52,11 @@ MODELS=`[
 
 Or use the Gemini API API provider [from](https://github.com/google-gemini/generative-ai-js#readme):
 
-
+Make sure that you have an API key from Google Cloud Platform. To get an API key, follow the instructions [here](https://ai.google.dev/gemini-api/docs/api-key).
+
+You can either specify them directly in your `.env.local` using the `GOOGLE_GENAI_API_KEY` variables, or you can set them directly in the endpoint config.
+
+You can find the list of models available [here](https://ai.google.dev/gemini-api/docs/models/gemini), and experimental models available [here](https://ai.google.dev/gemini-api/docs/models/experimental-models).
 
 ```ini
 MODELS=`[
@@ -63,12 +67,12 @@ MODELS=`[
     "endpoints": [
       {
         "type": "genai",
+
+        // Optional
         "apiKey": "abc...xyz"
+        "safetyThreshold": "BLOCK_MEDIUM_AND_ABOVE",
       }
     ]
-
-    // Optional
-    "safetyThreshold": "BLOCK_MEDIUM_AND_ABOVE",
   },
   {
     "name": "gemini-1.5-pro",
@@ -77,6 +81,8 @@ MODELS=`[
     "endpoints": [
       {
         "type": "genai",
+
+        // Optional
         "apiKey": "abc...xyz"
       }
     ]
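For reference, a rough, self-contained sketch of what the documented options translate to when driving the `@google/generative-ai` SDK directly, with the key read from `GOOGLE_GENAI_API_KEY` and a single illustrative safety setting (values here are examples, not taken from this commit):

```ts
import { GoogleGenerativeAI, HarmBlockThreshold, HarmCategory } from "@google/generative-ai";

async function main() {
  // The client takes the API key; here it is read from the environment.
  const genAI = new GoogleGenerativeAI(process.env.GOOGLE_GENAI_API_KEY ?? "");

  // The config's "safetyThreshold" ends up as per-category safety settings on the model.
  const model = genAI.getGenerativeModel({
    model: "gemini-1.5-flash",
    safetySettings: [
      {
        category: HarmCategory.HARM_CATEGORY_HARASSMENT,
        threshold: HarmBlockThreshold.BLOCK_MEDIUM_AND_ABOVE,
      },
    ],
    generationConfig: { maxOutputTokens: 4096 },
  });

  const result = await model.generateContent("Say hello in one sentence.");
  console.log(result.response.text());
}

main().catch(console.error);
```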
src/lib/server/endpoints/google/endpointGenAI.ts CHANGED

@@ -1,17 +1,18 @@
 import { GoogleGenerativeAI, HarmBlockThreshold, HarmCategory } from "@google/generative-ai";
-import type { Content, Part, TextPart } from "@google/generative-ai";
+import type { Content, Part, SafetySetting, TextPart } from "@google/generative-ai";
 import { z } from "zod";
 import type { Message, MessageFile } from "$lib/types/Message";
 import type { TextGenerationStreamOutput } from "@huggingface/inference";
 import type { Endpoint } from "../endpoints";
 import { createImageProcessorOptionsValidator, makeImageProcessor } from "../images";
 import type { ImageProcessorOptions } from "../images";
+import { env } from "$env/dynamic/private";
 
 export const endpointGenAIParametersSchema = z.object({
   weight: z.number().int().positive().default(1),
   model: z.any(),
   type: z.literal("genai"),
-  apiKey: z.string(),
+  apiKey: z.string().default(env.GOOGLE_GENAI_API_KEY),
   safetyThreshold: z
     .enum([
       HarmBlockThreshold.HARM_BLOCK_THRESHOLD_UNSPECIFIED,
@@ -40,35 +41,24 @@ export function endpointGenAI(input: z.input<typeof endpointGenAIParametersSchem
 
   const genAI = new GoogleGenerativeAI(apiKey);
 
+  const safetySettings = safetyThreshold
+    ? Object.keys(HarmCategory)
+        .filter((cat) => cat !== HarmCategory.HARM_CATEGORY_UNSPECIFIED)
+        .reduce((acc, val) => {
+          acc.push({
+            category: val as HarmCategory,
+            threshold: safetyThreshold,
+          });
+          return acc;
+        }, [] as SafetySetting[])
+    : undefined;
+
   return async ({ messages, preprompt, generateSettings }) => {
     const parameters = { ...model.parameters, ...generateSettings };
 
     const generativeModel = genAI.getGenerativeModel({
       model: model.id ?? model.name,
-      safetySettings: safetyThreshold
-        ? [
-            {
-              category: HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT,
-              threshold: safetyThreshold,
-            },
-            {
-              category: HarmCategory.HARM_CATEGORY_HARASSMENT,
-              threshold: safetyThreshold,
-            },
-            {
-              category: HarmCategory.HARM_CATEGORY_HATE_SPEECH,
-              threshold: safetyThreshold,
-            },
-            {
-              category: HarmCategory.HARM_CATEGORY_SEXUALLY_EXPLICIT,
-              threshold: safetyThreshold,
-            },
-            {
-              category: HarmCategory.HARM_CATEGORY_UNSPECIFIED,
-              threshold: safetyThreshold,
-            },
-          ]
-        : undefined,
+      safetySettings,
       generationConfig: {
         maxOutputTokens: parameters?.max_new_tokens ?? 4096,
         stopSequences: parameters?.stop,