Add Gemini 2.0 Flash (Experimental): register a deployment entry that uses
VertexAIChatClient and the matching model metadata entry for
google/gemini-2.0-flash-exp.

diff --git a/src/helm/config/model_deployments.yaml b/src/helm/config/model_deployments.yaml
index bb9aed655f..2b21f84606 100644
--- a/src/helm/config/model_deployments.yaml
+++ b/src/helm/config/model_deployments.yaml
@@ -553,6 +553,14 @@ model_deployments:
     client_spec:
       class_name: "helm.clients.vertexai_client.VertexAIChatClient"
 
+  - name: google/gemini-2.0-flash-exp
+    model_name: google/gemini-2.0-flash-exp
+    tokenizer_name: google/gemma-2b  # Gemini has no tokenizer endpoint, so we approximate by using Gemma's tokenizer.
+    max_sequence_length: 1000000  # Source: https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-models
+    # TODO: Max output tokens: 8192
+    client_spec:
+      class_name: "helm.clients.vertexai_client.VertexAIChatClient"
+
   ## Gemma
   - name: together/gemma-2b
     model_name: google/gemma-2b
diff --git a/src/helm/config/model_metadata.yaml b/src/helm/config/model_metadata.yaml
index 84227602ca..1728216ed5 100644
--- a/src/helm/config/model_metadata.yaml
+++ b/src/helm/config/model_metadata.yaml
@@ -997,6 +997,14 @@ models:
     release_date: 2024-09-24
     tags: [TEXT_MODEL_TAG, VISION_LANGUAGE_MODEL_TAG, AUDIO_LANGUAGE_MODEL_TAG, GOOGLE_GEMINI_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG, INSTRUCTION_FOLLOWING_MODEL_TAG]
 
+  - name: google/gemini-2.0-flash-exp
+    display_name: Gemini 2.0 Flash (Experimental)
+    description: Gemini 2.0 Flash (Experimental) is a Gemini model that supports multimodal inputs like images, video and audio, as well as multimodal output like natively generated images mixed with text and steerable text-to-speech (TTS) multilingual audio. ([blog](https://blog.google/technology/google-deepmind/google-gemini-ai-update-december-2024/#gemini-2-0-flash))
+    creator_organization_name: Google
+    access: limited
+    release_date: 2024-12-11
+    tags: [TEXT_MODEL_TAG, VISION_LANGUAGE_MODEL_TAG, AUDIO_LANGUAGE_MODEL_TAG, GOOGLE_GEMINI_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG, INSTRUCTION_FOLLOWING_MODEL_TAG]
+
   - name: google/gemma-2b
     display_name: Gemma (2B)
     description: Gemma is a family of lightweight, open models built from the research and technology that Google used to create the Gemini models. ([model card](https://www.kaggle.com/models/google/gemma), [blog post](https://blog.google/technology/developers/gemma-open-models/))