Commit 3a2c53d

feat: Add example for multimodal streaming response
1 parent f5b6c48 commit 3a2c53d

File tree

3 files changed: +106 -1 lines changed

generative-ai/snippets/inference/nonStreamMultiModalityBasic.js

Lines changed: 1 addition & 1 deletion
@@ -42,7 +42,7 @@ async function generateContent(
           {
             file_data: {
               file_uri: 'gs://generativeai-downloads/images/character.jpg',
-              mime_type: 'video/mp4',
+              mime_type: 'image/jpeg',
             },
           },
         ],
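Note (not part of the commit): the fix above simply makes mime_type agree with the JPEG that file_uri points to. A purely illustrative helper like the following keeps the two fields from drifting apart; the MIME table and the filePart name are assumptions for the sketch, not code from this repository.

// Illustrative sketch only: derive mime_type from the file extension so it
// cannot disagree with file_uri. Extend MIME_BY_EXTENSION as needed.
const MIME_BY_EXTENSION = {
  jpg: 'image/jpeg',
  jpeg: 'image/jpeg',
  png: 'image/png',
  mp4: 'video/mp4',
};

function filePart(fileUri) {
  const extension = fileUri.split('.').pop().toLowerCase();
  const mimeType = MIME_BY_EXTENSION[extension];
  if (!mimeType) {
    throw new Error(`Unsupported file extension in ${fileUri}`);
  }
  return {file_data: {file_uri: fileUri, mime_type: mimeType}};
}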
generative-ai/snippets/inference/streamMultiModalityBasic.js

Lines changed: 64 additions & 0 deletions

@@ -0,0 +1,64 @@
// Copyright 2024 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

// [START generativeaionvertexai_stream_multimodality_basic]
const {VertexAI} = require('@google-cloud/vertexai');

/**
 * TODO(developer): Update these variables before running the sample.
 */
async function generateContent(
  projectId = 'PROJECT_ID',
  location = 'us-central1',
  model = 'gemini-1.5-pro-preview-0409'
) {
  // Initialize Vertex AI
  const vertexAI = new VertexAI({project: projectId, location: location});
  const generativeModel = vertexAI.getGenerativeModel({model: model});

  const request = {
    contents: [
      {
        role: 'user',
        parts: [
          {text: 'Are following video and image correlated?'},
          {
            file_data: {
              file_uri: 'gs://cloud-samples-data/video/animals.mp4',
              mime_type: 'video/mp4',
            },
          },
          {
            file_data: {
              file_uri: 'gs://generativeai-downloads/images/character.jpg',
              mime_type: 'image/jpeg',
            },
          },
        ],
      },
    ],
  };

  const result = await generativeModel.generateContentStream(request);

  for await (const item of result.stream) {
    console.log(item.candidates[0].content.parts[0].text);
  }
}
// [END generativeaionvertexai_stream_multimodality_basic]

generateContent(...process.argv.slice(2)).catch(err => {
  console.error(err.message);
  process.exitCode = 1;
});
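For callers that want the final aggregated answer in addition to the streamed chunks, recent versions of @google-cloud/vertexai also expose an aggregated response promise on the same result object. A minimal sketch of that pattern follows; it reuses the generativeModel and request from the sample above, and the generateContentWithAggregate name is an assumption for illustration, not part of this commit.

// Minimal sketch, not part of the commit: assumes result.response resolves to
// the aggregated GenerateContentResponse once the stream is fully consumed.
async function generateContentWithAggregate(generativeModel, request) {
  const result = await generativeModel.generateContentStream(request);

  let streamedText = '';
  for await (const item of result.stream) {
    // Each chunk carries a partial candidate; guard against empty parts.
    const part = item.candidates?.[0]?.content?.parts?.[0];
    if (part?.text) {
      streamedText += part.text;
    }
  }

  // Full response, available after the stream has finished.
  const aggregated = await result.response;
  return {streamedText, aggregated};
}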
Lines changed: 41 additions & 0 deletions

@@ -0,0 +1,41 @@
// Copyright 2024 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

'use strict';

const {assert} = require('chai');
const {describe, it} = require('mocha');
const cp = require('child_process');
const execSync = cmd => cp.execSync(cmd, {encoding: 'utf-8'});

const projectId = process.env.CAIP_PROJECT_ID;
const location = process.env.LOCATION;
const model = 'gemini-1.0-pro';

describe('Generative AI Basic Text Inference Streaming', () => {
  /**
   * TODO(developer): Uncomment these variables before running the sample.
   * (Not necessary if passing values as arguments)
   */
  // const projectId = 'YOUR_PROJECT_ID';
  // const location = 'YOUR_LOCATION';
  // const model = 'gemini-1.0-pro';

  it('should create a generative text model and infer text from a prompt, streaming the results', async () => {
    const output = execSync(
      `node ./inference/streamMultiModalityBasic.js ${projectId} ${location} ${model}`
    );
    assert(output.length > 0);
  });
});
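The test shells out to the new streaming sample and only asserts that it produced some output. It expects CAIP_PROJECT_ID and LOCATION to be set in the environment (or the commented-out constants to be filled in); with those exported, it can be run through the repository's usual mocha setup, for example `npx mocha` pointed at this test file.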
