GoogleCloudPlatform · cabljac · Nov 29, 2024 · Nov 26, 2024 · Nov 28, 2024 · Nov 28, 2024
diff --git a/firestore-multimodal-genai/CHANGELOG.md b/firestore-multimodal-genai/CHANGELOG.md
@@ -1,6 +1,8 @@
 ## Version 1.0.1
 
-fix - update default Gemini models
+- refactor: add Genkit SDK dependency
+
+- fix: update default Gemini models
 
 ## Version 1.0.0
 

diff --git a/firestore-multimodal-genai/POSTINSTALL.md b/firestore-multimodal-genai/POSTINSTALL.md
@@ -40,11 +40,13 @@ For Vertex AI, the list of models is [here](https://cloud.google.com/vertex-ai/d
 
 #### Multimodal Prompts
 
-The Gemini Pro Vision model accepts multimodal prompts. This extension allows for multimodal prompting using this model.
+Many of the Gemini models accept multimodal prompts. This extension allows for multimodal prompting with images using these models.
 
 On installation you may pick an `image` field. The image field must be the Cloud Storage URL of an object (e.g `gs://my-bucket.appspot.com/filename.png`). This image will then be provided as part of the prompt to Gemini Pro Vision.
 
-Note that Google AI requires prompts to have both an image and text part, whereas Vertex AI allows gemini-pro-vision to be prompted with text only as well. If you have selected to use the Gemini Pro Vision model and have Google AI as a provider then any document handled by the extension must contain an image field.
+Note that Google AI requires prompts to have both an image and text part, whereas Vertex AI allows gemini-pro-vision to be prompted with text only as well.
+
+If you have selected the Gemini Pro Vision model (deprecated) and use Google AI as the provider, then any document handled by the extension must contain an image field.
 
 The Gemini Pro Vision API has a limit on image sizes. For Google AI this limit is currently 1MB, and for Vertex AI this limit is 4MB. This extension compress and resize images that fall above this limit.
 

diff --git a/firestore-multimodal-genai/functions/__tests__/genkit/client.test.ts b/firestore-multimodal-genai/functions/__tests__/genkit/client.test.ts
@@ -0,0 +1,317 @@
+import {GenkitGenerativeClient} from '../../src/generative-client/genkit';
+import {logger} from 'firebase-functions/v1';
+import {GenerateResponse, genkit} from 'genkit';
+import {googleAI} from '@genkit-ai/googleai';
+import {vertexAI} from '@genkit-ai/vertexai';
+import {Config} from '../../src/config.js';
+import {HarmBlockThreshold, HarmCategory} from '@google/generative-ai';
+
+// Module mocks. Each factory below is self-contained (it references nothing
+// but `jest`), which keeps it valid when Jest hoists `jest.mock` calls above
+// the imports.
+//
+// Mock the genkit library: `genkit()` returns an object exposing a mocked
+// `generate` function.
+jest.mock('genkit', () => ({
+  genkit: jest.fn().mockReturnValue({generate: jest.fn()}),
+}));
+
+// Mock the Google AI plugin: `googleAI()` returns a stub plugin object, and the
+// three exported model references carry only a `name` and a mocked
+// `withVersion`.
+jest.mock('@genkit-ai/googleai', () => ({
+  googleAI: jest.fn().mockReturnValue({name: 'googleai'}),
+  gemini10Pro: {name: 'googleai/gemini-1.0-pro', withVersion: jest.fn()},
+  gemini15Flash: {name: 'googleai/gemini-1.5-flash', withVersion: jest.fn()},
+  gemini15Pro: {name: 'googleai/gemini-1.5-pro', withVersion: jest.fn()},
+}));
+
+// Mock the Vertex AI plugin with the same shape as the Google AI mock, using
+// `vertexai/`-prefixed model names.
+jest.mock('@genkit-ai/vertexai', () => ({
+  vertexAI: jest.fn().mockReturnValue({name: 'vertexai'}),
+  gemini10Pro: {name: 'vertexai/gemini-1.0-pro', withVersion: jest.fn()},
+  gemini15Flash: {name: 'vertexai/gemini-1.5-flash', withVersion: jest.fn()},
+  gemini15Pro: {name: 'vertexai/gemini-1.5-pro', withVersion: jest.fn()},
+}));
+
+// Mock the image helper so `getImageBase64` always resolves to a fixed
+// placeholder string.
+jest.mock('../../src/generative-client/image_utils.ts', () => ({
+  getImageBase64: jest.fn(() => Promise.resolve('base64EncodedImage')),
+}));
+
+/**
+ * Tests for `GenkitGenerativeClient`: constructor wiring per provider,
+ * `createModelReference`, and `generate()` with and without an image.
+ * Runs against the module mocks declared at the top of this file.
+ */
+describe('GenkitGenerativeClient', () => {
+  // Baseline configuration using the Google AI provider; individual tests
+  // spread it and override only the fields they exercise.
+  const mockConfig: Config = {
+    vertex: {
+      model: 'gemini-1.5-flash',
+    },
+    googleAi: {
+      model: 'gemini-1.5-flash',
+      apiKey: 'test-api-key',
+    },
+    model: 'gemini-1.5-flash',
+    location: 'us-central1',
+    projectId: 'test-project',
+    instanceId: 'test-instance',
+    prompt: 'Test prompt',
+    responseField: 'output',
+    collectionName: 'users/{uid}/discussions/{discussionId}/messages',
+    temperature: 0.7,
+    topP: 0.9,
+    topK: 50,
+    candidates: {
+      field: 'candidates',
+      count: 1,
+      shouldIncludeCandidatesField: false,
+    },
+    maxOutputTokens: 256,
+    maxOutputTokensVertex: 1024,
+    provider: 'google-ai',
+    apiKey: 'test-api-key',
+    safetySettings: [
+      {
+        category: HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT,
+        threshold: HarmBlockThreshold.BLOCK_LOW_AND_ABOVE,
+      },
+    ],
+    bucketName: 'test-bucket',
+    imageField: 'image',
+  };
+
+  // Canned value that the stubbed `client.client.generate` resolves with.
+  const mockGenerateResponse = {
+    text: 'Generated text response',
+    finishReason: 'stop',
+    usage: {
+      inputTokens: 10,
+      outputTokens: 20,
+      totalTokens: 30,
+    },
+    custom: null,
+    raw: null,
+  };
+
+  beforeEach(() => {
+    jest.clearAllMocks();
+  });
+
+  // Undo every jest.spyOn replacement (e.g. logger.error) so a spy installed
+  // by one test cannot leak into later tests.
+  afterEach(() => {
+    jest.restoreAllMocks();
+  });
+
+  it('should initialize with correct plugin and client for Google AI', () => {
+    new GenkitGenerativeClient(mockConfig);
+
+    expect(googleAI).toHaveBeenCalledWith({apiKey: 'test-api-key'});
+    expect(genkit).toHaveBeenCalledWith({
+      plugins: [expect.anything()],
+    });
+  });
+
+  it('should initialize with correct plugin and client for Vertex AI', () => {
+    const vertexConfig: Config = {
+      ...mockConfig,
+      provider: 'vertex-ai',
+      googleAi: {model: 'gemini-1.5-flash', apiKey: '123'},
+      model: 'gemini-1.5-flash',
+    };
+    new GenkitGenerativeClient(vertexConfig);
+
+    expect(vertexAI).toHaveBeenCalledWith({location: 'us-central1'});
+    expect(genkit).toHaveBeenCalledWith({
+      plugins: [expect.anything()],
+    });
+  });
+
+  it('should throw an error if no API key is provided for Google AI', () => {
+    // NOTE(review): only `googleAi.apiKey` is cleared here; the top-level
+    // `apiKey` inherited from mockConfig stays set. Presumably the client
+    // reads `googleAi.apiKey` - confirm against the implementation.
+    const invalidConfig: Config = {
+      ...mockConfig,
+      googleAi: {model: 'gemini-1.5-flash', apiKey: undefined},
+    };
+
+    expect(() => new GenkitGenerativeClient(invalidConfig)).toThrow(
+      'API key required for Google AI.'
+    );
+  });
+
+  it('should throw an error if an invalid provider is specified', () => {
+    const invalidConfig: Config = {...mockConfig, provider: 'invalid-provider'};
+
+    expect(() => new GenkitGenerativeClient(invalidConfig)).toThrow(
+      'Invalid provider specified.'
+    );
+  });
+
+  it('should create the correct model reference', () => {
+    const modelReference = GenkitGenerativeClient.createModelReference(
+      'gemini-1.5-flash',
+      'google-ai'
+    );
+
+    // Dedicated matcher gives a readable failure message if the lookup fails.
+    expect(modelReference).not.toBeNull();
+    expect(modelReference).toHaveProperty('name');
+    // Optional chaining instead of `!`: a null reference fails the assertion
+    // rather than throwing a TypeError.
+    expect(modelReference?.name).toBe('googleai/gemini-1.5-flash');
+  });
+
+  it('should call generate with correct options and return response', async () => {
+    const client = new GenkitGenerativeClient(mockConfig);
+    client.client.generate = jest.fn(() =>
+      Promise.resolve(mockGenerateResponse as unknown as GenerateResponse<any>)
+    );
+
+    const response = await client.generate('Test prompt');
+
+    expect(client.client.generate).toHaveBeenCalledWith({
+      messages: [
+        {
+          role: 'user',
+          content: [{text: 'Test prompt'}],
+        },
+      ],
+      model: expect.any(Object),
+      config: expect.any(Object),
+    });
+
+    expect(response).toEqual({candidates: ['Generated text response']});
+  });
+
+  it('should process an image if provided', async () => {
+    const client = new GenkitGenerativeClient(mockConfig);
+    client.client.generate = jest.fn(() =>
+      Promise.resolve(mockGenerateResponse as unknown as GenerateResponse<any>)
+    );
+
+    const response = await client.generate('Test prompt', {
+      image: 'path/to/image.jpg',
+    });
+
+    expect(client.client.generate).toHaveBeenCalledWith({
+      messages: [
+        {
+          role: 'user',
+          content: [
+            {text: 'Test prompt'},
+            // Payload comes from the mocked getImageBase64 helper.
+            {media: {url: 'data:image/jpeg;base64,base64EncodedImage'}},
+          ],
+        },
+      ],
+      model: {
+        name: 'googleai/gemini-1.5-flash',
+        withVersion: expect.any(Function),
+      },
+      config: {
+        topP: 0.9,
+        topK: 50,
+        temperature: 0.7,
+        maxOutputTokens: 256,
+        safetySettings: [
+          {
+            category: HarmCategory.HARM_CATEGORY_DANGEROUS_CONTENT,
+            threshold: HarmBlockThreshold.BLOCK_LOW_AND_ABOVE,
+          },
+        ],
+      },
+      // NOTE(review): the raw `image` option is expected in the request
+      // passed to Genkit - presumably the caller's options are spread into
+      // it; confirm this pass-through is intended.
+      image: 'path/to/image.jpg',
+    });
+
+    expect(response).toEqual({candidates: ['Generated text response']});
+  });
+
+  it('should log an error and throw if generate fails', async () => {
+    const client = new GenkitGenerativeClient(mockConfig);
+    const error = new Error('Generation failed');
+    client.client.generate = jest.fn(() => Promise.reject(error));
+    // Spy on logger.error rather than reassigning it, so the real logger is
+    // put back by restoreAllMocks() in afterEach.
+    const errorSpy = jest
+      .spyOn(logger, 'error')
+      .mockImplementation(() => undefined);
+
+    await expect(client.generate('Test prompt')).rejects.toThrow(
+      'Content generation failed.'
+    );
+
+    expect(errorSpy).toHaveBeenCalledWith(
+      'Failed to generate content:',
+      error
+    );
+  });
+});
+
+/**
+ * Tests for the static `GenkitGenerativeClient.shouldUseGenkitClient`
+ * decision: it is expected to return false for "pro-vision" models, for
+ * multiple requested candidates, and when no model reference is found, and
+ * true otherwise.
+ */
+describe('GenkitGenerativeClient.shouldUseGenkitClient', () => {
+  // Baseline configuration (Google AI provider, single candidate); tests
+  // spread it and override only the field under test.
+  const baseConfig: Config = {
+    vertex: {model: 'gemini-1.0-pro'},
+    googleAi: {model: 'gemini-1.5-flash', apiKey: 'test-api-key'},
+    model: 'gemini-1.5-flash',
+    location: 'us-central1',
+    projectId: 'test-project',
+    instanceId: 'test-instance',
+    prompt: 'Test prompt',
+    responseField: 'output',
+    collectionName: 'users/{uid}/discussions/{discussionId}/messages',
+    temperature: 0.7,
+    topP: 0.9,
+    topK: 50,
+    candidates: {
+      field: 'candidates',
+      count: 1,
+      shouldIncludeCandidatesField: false,
+    },
+    maxOutputTokens: 256,
+    maxOutputTokensVertex: 1024,
+    provider: 'google-ai',
+    apiKey: 'test-api-key',
+    safetySettings: [
+      {
+        category: HarmCategory.HARM_CATEGORY_HARASSMENT,
+        threshold: HarmBlockThreshold.BLOCK_LOW_AND_ABOVE,
+      },
+    ],
+    bucketName: 'test-bucket',
+    imageField: 'image',
+  };
+
+  beforeEach(() => {
+    jest.clearAllMocks();
+  });
+
+  // clearAllMocks() only wipes recorded calls; it neither removes a spy nor
+  // drops a queued mockReturnValueOnce value. Restoring after each test puts
+  // the real createModelReference back so no stubbed return can leak forward.
+  afterEach(() => {
+    jest.restoreAllMocks();
+  });
+
+  it('should return false if the model includes "pro-vision"', () => {
+    const config = {...baseConfig, model: 'gemini-pro-vision'};
+
+    const result = GenkitGenerativeClient.shouldUseGenkitClient(config);
+
+    expect(result).toBe(false);
+  });
+
+  it('should return false if multiple candidates are requested', () => {
+    const config = {
+      ...baseConfig,
+      candidates: {
+        field: 'candidates',
+        count: 2,
+        shouldIncludeCandidatesField: true,
+      },
+    };
+
+    const result = GenkitGenerativeClient.shouldUseGenkitClient(config);
+
+    expect(result).toBe(false);
+  });
+
+  it('should return false if no model reference is found', () => {
+    const config = {...baseConfig, model: 'unknown-model'};
+
+    // Force the lookup to report "no such model".
+    jest
+      .spyOn(GenkitGenerativeClient, 'createModelReference')
+      .mockReturnValueOnce(null);
+
+    const result = GenkitGenerativeClient.shouldUseGenkitClient(config);
+
+    expect(result).toBe(false);
+  });
+
+  it('should return true if conditions are met for Genkit client usage', () => {
+    const config = {...baseConfig, model: 'gemini-1.5-flash'};
+
+    // Stub the lookup with a minimal model-reference-shaped object.
+    jest
+      .spyOn(GenkitGenerativeClient, 'createModelReference')
+      .mockReturnValueOnce({
+        name: 'googleai/gemini-1.5-flash',
+        withVersion: jest.fn(),
+        withConfig: jest.fn(),
+      });
+
+    const result = GenkitGenerativeClient.shouldUseGenkitClient(config);
+
+    expect(result).toBe(true);
+  });
+
+  it('should call createModelReference with correct parameters', () => {
+    // Plain spy: the real implementation still runs, only the call is recorded.
+    const spy = jest.spyOn(GenkitGenerativeClient, 'createModelReference');
+
+    GenkitGenerativeClient.shouldUseGenkitClient(baseConfig);
+
+    expect(spy).toHaveBeenCalledWith('gemini-1.5-flash', 'google-ai');
+  });
+});