Skip to content

Commit 6d53416

Browse files
brb-nvmikeiovine
authored andcommitted
[https://nvbugs/5568836][fix] Skip keyword matching for Gemma3 e2e test (NVIDIA#9158)
Signed-off-by: Balaram Buddharaju <169953907+brb-nv@users.noreply.github.com> Signed-off-by: Mike Iovine <6158008+mikeiovine@users.noreply.github.com> Signed-off-by: Mike Iovine <miovine@nvidia.com>
1 parent 0204dc7 commit 6d53416

File tree

1 file changed

+24
-19
lines changed

1 file changed

+24
-19
lines changed

tests/integration/defs/test_e2e.py

Lines changed: 24 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -2521,13 +2521,6 @@ def test_ptp_quickstart_multimodal(llm_root, llm_venv, model_name, model_path,
25212521
[["invention", "person", "scientists", "Lick", "engineers"],
25222522
["landscape", "trees", "road", "depicts", "scenic"]]
25232523
},
2524-
"gemma-3-27b-it": {
2525-
"image": [
2526-
["natural", "turbulent", "dramatic", "scene", "wave"],
2527-
["image", "famous", "rock", "granite", "landmark"],
2528-
["traffic", "moderate", "heavy", "flowing", "cars"],
2529-
],
2530-
},
25312524
}
25322525

25332526
cmd = [
@@ -2557,6 +2550,14 @@ def test_ptp_quickstart_multimodal(llm_root, llm_venv, model_name, model_path,
25572550

25582551
output = llm_venv.run_cmd(cmd, caller=check_output)
25592552

2553+
# For gemma-3-27b-it, we only smoke test the model. Keyword matching is flaky.
2554+
if model_name == "gemma-3-27b-it":
2555+
print(
2556+
f"Skipping keyword matching test for {model_name}. Smoke test completed successfully."
2557+
)
2558+
print("output:", output)
2559+
return
2560+
25602561
match_ratio = 4.0 / 5
25612562
parsed_outputs = parse_output(output)
25622563
for prompt_output, prompt_keywords in zip(
@@ -2994,12 +2995,6 @@ def test_ptp_quickstart_multimodal_2gpu(llm_root, llm_venv, model_name,
29942995

29952996
# Define expected keywords for each model
29962997
expected_keywords = {
2997-
"gemma-3-27b-it": {
2998-
"image": [
2999-
["half", "dome", "yosemite", "landmark", "rounded"],
3000-
["flowing", "traffic", "vehicles", "road", "Changi"],
3001-
],
3002-
},
30032998
"mistral-small-3.1-24b-instruct": {
30042999
"image": [
30053000
["scenic", "rock", "landscape", "monolith", "formation"],
@@ -3066,6 +3061,14 @@ def test_ptp_quickstart_multimodal_2gpu(llm_root, llm_venv, model_name,
30663061

30673062
output = llm_venv.run_cmd(cmd, caller=check_output)
30683063

3064+
# For gemma-3-27b-it, we only smoke test the model. Keyword matching is flaky.
3065+
if model_name == "gemma-3-27b-it":
3066+
print(
3067+
f"Skipping keyword matching test for {model_name}. Smoke test completed successfully."
3068+
)
3069+
print("output:", output)
3070+
return
3071+
30693072
# Set match ratio based on model
30703073
match_ratio = 4.0 / 5
30713074
if model_name.startswith("phi4-multimodal-instruct"):
@@ -3120,12 +3123,6 @@ def test_ptp_quickstart_multimodal_multiturn(llm_root, llm_venv, model_name,
31203123

31213124
# Define expected keywords for each model
31223125
expected_keywords = {
3123-
"gemma-3-27b-it": {
3124-
"image": [
3125-
["description", "image", "half", "dome", "park"],
3126-
["atmosphere", "peaceful", "majestic", "scene", "sky"],
3127-
],
3128-
},
31293126
"mistral-small-3.1-24b-instruct": {
31303127
"image": [
31313128
[
@@ -3192,6 +3189,14 @@ def test_ptp_quickstart_multimodal_multiturn(llm_root, llm_venv, model_name,
31923189

31933190
output = llm_venv.run_cmd(cmd, caller=check_output)
31943191
print("output:", output)
3192+
3193+
# For gemma-3-27b-it, we only smoke test the model. Keyword matching is flaky.
3194+
if model_name == "gemma-3-27b-it":
3195+
print(
3196+
f"Skipping keyword matching test for {model_name}. Smoke test completed successfully."
3197+
)
3198+
return
3199+
31953200
# Set match ratio based on model
31963201
match_ratio = 4.0 / 5
31973202
if model_name.startswith("Phi-4-multimodal-instruct"):

0 commit comments

Comments
 (0)