feat: vertex and image compression (#340)
* feat(*): add vertex to gemini exts

* feat(*): add some compression to large images

* test(firestore-multimodal-genai, firestore-genai-chatbot): added test suite for vertex

* fix(firestore-multimodal-genai): update function memory

* docs(*): add reference for ADC

* test(firestore-multimodal-genai): added more tests

* Update firestore-genai-chatbot/extension.yaml

Co-authored-by: Mais Alheraki <[email protected]>

* Update firestore-multimodal-genai/extension.yaml

Co-authored-by: Mais Alheraki <[email protected]>

* docs(firestore-multimodal-genai): update postinstall

* chore(*): update tsconfigs

* chore(*): bump versions

* test(storage-reverse-image-search): silence logs

* test(storage-reverse-image-search): fix flaky tests

---------

Co-authored-by: Mais Alheraki <[email protected]>
cabljac and pr-Mais authored Jan 24, 2024
1 parent 027dff7 commit 38fd6d4
Showing 44 changed files with 3,094 additions and 7,628 deletions.
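The second bullet in the commit message mentions compressing large images before they are sent to the model. That code is not shown in the excerpt below, but a minimal sketch of the idea, assuming a sharp-based downscale (the threshold and helper name here are illustrative, not the extension's actual implementation):

```ts
// Illustrative sketch only: compress large inline images before sending them to Gemini.
// The actual extension may use different limits or a different library.
import sharp from 'sharp';

const MAX_IMAGE_BYTES = 4 * 1024 * 1024; // assumed payload limit, not the extension's real value

export async function compressIfLarge(image: Buffer): Promise<Buffer> {
  if (image.byteLength <= MAX_IMAGE_BYTES) return image;
  // Downscale and re-encode as JPEG to shrink the payload.
  return sharp(image)
    .resize({width: 1024, withoutEnlargement: true})
    .jpeg({quality: 80})
    .toBuffer();
}
```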
4 changes: 4 additions & 0 deletions firestore-genai-chatbot/CHANGELOG.md
@@ -1,3 +1,7 @@
## Version 0.0.5

- Add Vertex AI provider

## Version 0.0.4

- Fix context parameter
2 changes: 1 addition & 1 deletion firestore-genai-chatbot/README.md
@@ -73,7 +73,7 @@ Additionally, this extension uses the Google AI Gemini API. For more details on

**Configuration Parameters:**

* Gemini API Provider: This extension makes use of the Gemini family of large language models. Currently the extension only supports the Google AI API (for developers) but in future will support the Vertex AI Gemini API.
* Gemini API Provider: This extension makes use of the Gemini family of large language models. For Google AI you will require an API key, whereas Vertex AI will authenticate using application default credentials. For more information see the [docs](https://firebase.google.com/docs/admin/setup#initialize-sdk).

* API Key for Gemini: Please enter your API key for the Google AI Gemini API.

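The distinction in the updated parameter description comes down to how the underlying client is constructed. A minimal sketch of the two auth paths using the public SDKs (project ID and model name are placeholders; this is not the extension's source):

```ts
import {GoogleGenerativeAI} from '@google/generative-ai';
import {VertexAI} from '@google-cloud/vertexai';

// Google AI: an explicit API key is required.
const googleAi = new GoogleGenerativeAI(process.env.GOOGLE_AI_API_KEY!);
const googleAiModel = googleAi.getGenerativeModel({model: 'gemini-pro'});

// Vertex AI: no API key; Application Default Credentials are picked up from the
// environment (e.g. `gcloud auth application-default login` or the runtime service account).
const vertexAi = new VertexAI({project: 'my-project', location: 'us-central1'});
const vertexModel = vertexAi.preview.getGenerativeModel({model: 'gemini-pro'});
```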
20 changes: 12 additions & 8 deletions firestore-genai-chatbot/extension.yaml
@@ -1,5 +1,5 @@
name: firestore-genai-chatbot
version: 0.0.4
version: 0.0.5
specVersion: v1beta

icon: icon.png
@@ -53,10 +53,10 @@ roles:
reason:
Allows this extension to access Cloud Firestore to read and process added
messages.
# - role: aiplatform.user
# reason:
# Allows this extension to access the Vertex AI API if this provider is
# chosen.
- role: aiplatform.user
reason:
Allows this extension to access the Vertex AI API if this provider is
chosen.

resources:
- name: generateMessage
@@ -75,12 +75,16 @@ params:
label: Gemini API Provider
description: >-
This extension makes use of the Gemini family of large language models.
Currently the extension only supports the Google AI API (for developers)
but in future will support the Vertex AI Gemini API.
For Google AI you will require an API key, whereas Vertex AI will
authenticate using application default credentials. For more information
see the
[docs](https://firebase.google.com/docs/admin/setup#initialize-sdk).
type: select
options:
- label: Google AI
value: google-ai
- label: Vertex AI
value: vertex-ai
required: true
default: google-ai
immutable: false
@@ -90,7 +94,7 @@ params:
description: >-
Please enter your API key for the Google AI Gemini API.
type: secret
required: true
required: false
immutable: false

- param: MODEL
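With the API key parameter switching to `required: false` above, the key only matters when the Google AI provider is selected. A hedged sketch of the kind of runtime check this implies; the `config` module and its shape are assumptions based on the test suite below, not the extension's actual source:

```ts
// Illustrative only: enforce the API key for the google-ai provider at runtime.
// `config` mirrors the shape mocked in the vertex_ai test suite below.
import config from './config';

export function assertProviderConfig(): void {
  if (config.provider === 'google-ai' && !config.googleAi.apiKey) {
    throw new Error(
      'An API key is required when the Gemini API provider is set to Google AI.'
    );
  }
  // For vertex-ai, Application Default Credentials plus the aiplatform.user role
  // declared above are sufficient; no API key is needed.
}
```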
File renamed without changes.
285 changes: 285 additions & 0 deletions firestore-genai-chatbot/functions/__tests__/vertex_ai/index.test.ts
@@ -0,0 +1,285 @@
import * as firebaseFunctionsTest from 'firebase-functions-test';
import * as admin from 'firebase-admin';
import config from '../../src/config';
import {generateMessage} from '../../src/index';
import {WrappedFunction} from 'firebase-functions-test/lib/v1';
import {Change} from 'firebase-functions/v1';

import {QuerySnapshot} from 'firebase-admin/firestore';
import {expectToProcessCorrectly} from '../util';

process.env.GCLOUD_PROJECT = 'demo-gcp';

process.env.FIRESTORE_EMULATOR_HOST = '127.0.0.1:8080';

// We mock out the config here instead of setting environment variables directly
jest.mock('../../src/config', () => ({
default: {
googleAi: {
model: 'gemini-pro',
apiKey: 'test-api-key',
},
vertex: {
model: 'gemini-pro',
},
collectionName: 'discussionsTestGenerative/{discussionId}/messages',
location: 'us-central1',
orderField: 'createTime',
promptField: 'prompt',
responseField: 'response',
enableDiscussionOptionOverrides: true,
candidatesField: 'candidates',
provider: 'vertex-ai',
model: 'gemini-pro',
apiKey: 'test-api-key',
},
}));

// Mocks used to capture the arguments passed to the Vertex AI client, model, and generateContentStream calls
const mockGetClient = jest.fn();
const mockGetModel = jest.fn();
const mockGenerateContentStream = jest.fn();

jest.mock('@google-cloud/vertexai', () => {
return {
...jest.requireActual('@google-cloud/vertexai'),
VertexAI: function mockedClient(args) {
mockGetClient(args);
return {
preview: {
getGenerativeModel: (args: unknown) => {
mockGetModel(args);
return {
generateContentStream: async function mockedGenerateContentStream(args) {
mockGenerateContentStream(args);
return {
response: {
candidates: [
{
content: {
parts: [
{
text: 'test response',
},
],
},
},
],
},
};
},
};
},
},
};
},
};
});

const fft = firebaseFunctionsTest({
projectId: 'demo-gcp',
});

admin.initializeApp({
projectId: 'demo-gcp',
});

type DocumentReference = admin.firestore.DocumentReference;
type DocumentData = admin.firestore.DocumentData;
type DocumentSnapshot = admin.firestore.DocumentSnapshot<DocumentData>;
type WrappedFirebaseFunction = WrappedFunction<
Change<DocumentSnapshot | undefined>,
void
>;
const Timestamp = admin.firestore.Timestamp;

const wrappedGenerateMessage = fft.wrap(
generateMessage
) as WrappedFirebaseFunction;

const firestoreObserver = jest.fn((_x: any) => {});
let collectionName: string;

describe('generateMessage', () => {
let unsubscribe: (() => void) | undefined;

// clear firestore
beforeEach(async () => {
await fetch(
`http://${process.env.FIRESTORE_EMULATOR_HOST}/emulator/v1/projects/demo-gcp/databases/(default)/documents`,
{method: 'DELETE'}
);
jest.clearAllMocks();
const randomInteger = Math.floor(Math.random() * 1000000);
collectionName = config.collectionName.replace(
'{discussionId}',
randomInteger.toString()
);

// set up observer on collection
unsubscribe = admin
.firestore()
.collection(collectionName)
.onSnapshot((snap: QuerySnapshot) => {
/** On the first init and write, the emulator can register an extra snapshot
* before the document is visible, which skews the observer call count.
* As a workaround, only record snapshots that actually contain documents.
*/
if (snap.docs.length) firestoreObserver(snap);
});
});
afterEach(() => {
if (unsubscribe && typeof unsubscribe === 'function') {
unsubscribe();
}
jest.clearAllMocks();
});

test('should not run if the prompt field is not set', async () => {
const notMessage = {
notPrompt: 'hello chat bison',
};
// Make a write to the collection. This won't trigger our wrapped function as it isn't deployed to the emulator.
const ref = await admin
.firestore()
.collection(collectionName)
.add(notMessage);

await simulateFunctionTriggered(wrappedGenerateMessage)(ref);

await expectNoOp();
});

test('should not run if the prompt field is empty', async () => {
const notMessage = {
prompt: '',
};

const ref = await admin
.firestore()
.collection(collectionName)
.add(notMessage);

await simulateFunctionTriggered(wrappedGenerateMessage)(ref);

await expectNoOp();
});

test('should not run if the prompt field is not a string', async () => {
const notMessage = {
prompt: 123,
};

const ref = await admin
.firestore()
.collection(collectionName)
.add(notMessage);

await simulateFunctionTriggered(wrappedGenerateMessage)(ref);

await expectNoOp();
});

test('should run when given createTime', async () => {
const message = {
prompt: 'hello chat bison',
createTime: Timestamp.now(),
};
const ref = await admin.firestore().collection(collectionName).add(message);

await simulateFunctionTriggered(wrappedGenerateMessage)(ref);

expect(firestoreObserver).toHaveBeenCalledTimes(3);

const firestoreCallData = firestoreObserver.mock.calls.map(call =>
call[0].docs[0].data()
);

expectToProcessCorrectly(
firestoreCallData,
message,
false,
'test response'
);

expect(mockGetClient).toHaveBeenCalledTimes(1);

expect(mockGetModel).toHaveBeenCalledTimes(1);
expect(mockGetModel).toHaveBeenCalledWith({model: config.vertex.model});
expect(mockGenerateContentStream).toHaveBeenCalledTimes(1);
expect(mockGenerateContentStream).toHaveBeenCalledWith({
contents: [{parts: [{text: 'hello chat bison'}], role: 'user'}],
generation_config: {
candidate_count: undefined,
max_output_tokens: undefined,
temperature: undefined,
top_k: undefined,
top_p: undefined,
},
});
});

test('should run when not given createTime', async () => {
const message = {
prompt: 'hello chat bison',
};

// Make a write to the collection. This won't trigger our wrapped function as it isn't deployed to the emulator.
const ref = await admin.firestore().collection(collectionName).add(message);

const beforeOrderField = await simulateFunctionTriggered(
wrappedGenerateMessage
)(ref);

await simulateFunctionTriggered(wrappedGenerateMessage)(
ref,
beforeOrderField
);

// we expect the firestore observer to be called 3 times total.
expect(firestoreObserver).toHaveBeenCalledTimes(3);

const firestoreCallData = firestoreObserver.mock.calls.map(call => {
return call[0].docs[0].data();
});

expectToProcessCorrectly(firestoreCallData, message, true, 'test response');

// Verify the SDK is called with the expected arguments;
// we expect the mocked client to be constructed once.
expect(mockGetClient).toHaveBeenCalledTimes(1);

expect(mockGetModel).toHaveBeenCalledTimes(1);
expect(mockGetModel).toHaveBeenCalledWith({model: config.vertex.model});
expect(mockGenerateContentStream).toHaveBeenCalledTimes(1);
expect(mockGenerateContentStream).toHaveBeenCalledWith({
contents: [{parts: [{text: 'hello chat bison'}], role: 'user'}],
generation_config: {
candidate_count: undefined,
max_output_tokens: undefined,
temperature: undefined,
top_k: undefined,
top_p: undefined,
},
});
});
});

const simulateFunctionTriggered =
(wrappedFunction: WrappedFirebaseFunction) =>
async (ref: DocumentReference, before?: DocumentSnapshot) => {
const data = (await ref.get()).data() as {[key: string]: unknown};
const beforeFunctionExecution = fft.firestore.makeDocumentSnapshot(
data,
`${collectionName}/${ref.id}`
) as DocumentSnapshot;
const change = fft.makeChange(before, beforeFunctionExecution);
await wrappedFunction(change);
return beforeFunctionExecution;
};

const expectNoOp = async () => {
await new Promise(resolve => setTimeout(resolve, 100));
expect(firestoreObserver).toHaveBeenCalledTimes(1);
expect(mockGetModel).toHaveBeenCalledTimes(0);
};
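For orientation, the mocked client and the assertions above imply a call path roughly like the following. This is reconstructed from the test's expectations, not taken from the extension's source, and the response handling follows the mocked return shape:

```ts
// Reconstructed from the test's mock assertions; parameter plumbing is simplified.
import {VertexAI} from '@google-cloud/vertexai';

async function generateVertexResponse(prompt: string) {
  const vertex = new VertexAI({
    project: process.env.GCLOUD_PROJECT!,
    location: 'us-central1',
  });
  const model = vertex.preview.getGenerativeModel({model: 'gemini-pro'});
  const result = await model.generateContentStream({
    contents: [{role: 'user', parts: [{text: prompt}]}],
    // The test asserts these keys are passed through even when unset.
    generation_config: {
      candidate_count: undefined,
      max_output_tokens: undefined,
      temperature: undefined,
      top_k: undefined,
      top_p: undefined,
    },
  });
  // In the mock, `response` is resolved directly; the real SDK returns a promise here.
  return await result.response;
}
```

The suite itself assumes a Firestore emulator listening on 127.0.0.1:8080 (see FIRESTORE_EMULATOR_HOST near the top of the file) and drives the wrapped function manually rather than relying on deployed triggers.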