Skip to content

Commit

Permalink
fix max tokens
Browse files: browse the repository at this point in the history
  • Loading branch information
teetone committed May 5, 2024
1 parent ae67281 commit edce2dc
Show file tree
Hide file tree
Showing 3 changed files with 6 additions and 5 deletions.
1 change: 1 addition & 0 deletions src/helm/benchmark/model_metadata_registry.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -32,6 +32,7 @@

GOOGLE_PALM_2_MODEL_TAG: str = "GOOGLE_PALM_2_MODEL_TAG"
GOOGLE_GEMINI_MODEL_TAG: str = "GOOGLE_GEMINI_MODEL_TAG"
GOOGLE_GEMINI_PRO_VISION_V1_TAG: str = "GOOGLE_GEMINI_PRO_VISION_V1_TAG"
GOOGLE_GEMMA_INSTRUCT_MODEL_TAG: str = "GOOGLE_GEMMA_INSTRUCT_MODEL_TAG"

# Models which emit garbage tokens when temperature=0.
Expand Down
6 changes: 3 additions & 3 deletions src/helm/benchmark/run_spec_factory.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -16,7 +16,7 @@
ANTHROPIC_CLAUDE_3_MODEL_TAG,
BUGGY_TEMP_0_TAG,
CHATML_MODEL_TAG,
GOOGLE_GEMINI_MODEL_TAG,
GOOGLE_GEMINI_PRO_VISION_V1_TAG,
IDEFICS_INSTRUCT_MODEL_TAG,
LLAVA_MODEL_TAG,
OPEN_FLAMINGO_MODEL_TAG,
Expand Down Expand Up @@ -130,10 +130,10 @@ def alter_run_spec(run_spec: RunSpec) -> RunSpec:
if ANTHROPIC_CLAUDE_3_MODEL_TAG in model.tags:
run_spec = singleton(AnthropicClaude3RunExpander().expand(run_spec))

# Google Gemini Vision returns an empty completion or throws an error if max_tokens is 1
# Google Gemini Vision v1.0 returns an empty completion or throws an error if max_tokens is 1
if (
VISION_LANGUAGE_MODEL_TAG in model.tags
and GOOGLE_GEMINI_MODEL_TAG in model.tags
and GOOGLE_GEMINI_PRO_VISION_V1_TAG in model.tags
and run_spec.adapter_spec.max_tokens == 1
):
run_spec = singleton(IncreaseMaxTokensRunExpander(value=1).expand(run_spec))
Expand Down
4 changes: 2 additions & 2 deletions src/helm/config/model_metadata.yaml
Original file line number | Diff line number | Diff line change
Expand Up @@ -695,10 +695,10 @@ models:
creator_organization_name: Google
access: limited
release_date: 2023-12-13
tags: [VISION_LANGUAGE_MODEL_TAG, GOOGLE_GEMINI_MODEL_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG]
tags: [VISION_LANGUAGE_MODEL_TAG, GOOGLE_GEMINI_MODEL_TAG, GOOGLE_GEMINI_PRO_VISION_V1_TAG, LIMITED_FUNCTIONALITY_TEXT_MODEL_TAG]

- name: google/gemini-1.5-pro-preview-0409
display_name: Gemini 1.5 Pro
display_name: Gemini 1.5 Pro (preview - 0409)
description: Gemini 1.5 Pro is a multimodal mixture-of-experts model capable of recalling and reasoning over fine-grained information from long contexts. ([paper](https://arxiv.org/abs/2403.05530))
creator_organization_name: Google
access: limited
Expand Down

0 comments on commit edce2dc

Please sign in to comment.