chat-ui-energy

Running

App Files Community

goupilew

nsarrazin committed on May 3, 2024

Commit

61d56f7

unverified ·

1 Parent(s): ba87c5b

[VertexAI] Add support for tools parameter (#1065)

Browse files

* [VertexAI] Add support for tools parameter

* Simplify tools parameter parsing and add support for passing parameters in model

---------

Co-authored-by: Nathan Sarrazin <[email protected]>

Files changed (2) hide show

README.md +6 -1
src/lib/server/endpoints/google/endpointVertex.ts +8 -4

README.md CHANGED Viewed

@@ -619,7 +619,12 @@ MODELS=`[
           // Optional
           "safetyThreshold": "BLOCK_MEDIUM_AND_ABOVE",
-          "apiEndpoint": "", // alternative api endpoint url
        }]
      },
 ]`

           // Optional
           "safetyThreshold": "BLOCK_MEDIUM_AND_ABOVE",
+          "apiEndpoint": "", // alternative api endpoint url
+          "tools": [{
+            "googleSearchRetrieval": {
+              "disableAttribution": true
+            }
+          }]
        }]
      },
 ]`

src/lib/server/endpoints/google/endpointVertex.ts CHANGED Viewed

@@ -26,10 +26,11 @@ export const endpointVertexParametersSchema = z.object({
 			HarmBlockThreshold.BLOCK_ONLY_HIGH,
 		])
 		.optional(),
 });
 export function endpointVertex(input: z.input<typeof endpointVertexParametersSchema>): Endpoint {
-	const { project, location, model, apiEndpoint, safetyThreshold } =
 		endpointVertexParametersSchema.parse(input);
 	const vertex_ai = new VertexAI({
@@ -39,6 +40,8 @@ export function endpointVertex(input: z.input<typeof endpointVertexParametersSch
 	});
 	return async ({ messages, preprompt, generateSettings }) => {
 		const generativeModel = vertex_ai.getGenerativeModel({
 			model: model.id ?? model.name,
 			safetySettings: safetyThreshold
@@ -66,10 +69,11 @@ export function endpointVertex(input: z.input<typeof endpointVertexParametersSch
 				  ]
 				: undefined,
 			generationConfig: {
-				maxOutputTokens: generateSettings?.max_new_tokens ?? 4096,
-				stopSequences: generateSettings?.stop,
-				temperature: generateSettings?.temperature ?? 1,
 			},
 		});
 		// Preprompt is the same as the first system message.

 			HarmBlockThreshold.BLOCK_ONLY_HIGH,
 		])
 		.optional(),
+	tools: z.array(z.any()),
 });
 export function endpointVertex(input: z.input<typeof endpointVertexParametersSchema>): Endpoint {
+	const { project, location, model, apiEndpoint, safetyThreshold, tools } =
 		endpointVertexParametersSchema.parse(input);
 	const vertex_ai = new VertexAI({
 	});
 	return async ({ messages, preprompt, generateSettings }) => {
+		const parameters = { ...model.parameters, ...generateSettings };
 		const generativeModel = vertex_ai.getGenerativeModel({
 			model: model.id ?? model.name,
 			safetySettings: safetyThreshold
 				  ]
 				: undefined,
 			generationConfig: {
+				maxOutputTokens: parameters?.max_new_tokens ?? 4096,
+				stopSequences: parameters?.stop,
+				temperature: parameters?.temperature ?? 1,
 			},
+			tools,
 		});
 		// Preprompt is the same as the first system message.