Skip to content

Commit 675ed6c

Browse files
authored
[llm bench] Fix setting ATTENTION_BACKEND to plugin config in case of fallback to Optimum (#2332)
[CVS-168817](https://jira.devtools.intel.com/browse/CVS-168817)
1 parent 69afd4c commit 675ed6c

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

tools/llm_bench/llm_bench_utils/ov_utils.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -132,7 +132,9 @@ def create_text_gen_model(model_path, device, memory_monitor, **kwargs):
132132
else:
133133
log.info("Selected OpenVINO GenAI for benchmarking")
134134
return create_genai_text_gen_model(model_path, device, ov_config, memory_monitor, **kwargs)
135+
135136
log.info("Selected Optimum Intel for benchmarking")
137+
ov_config.pop("ATTENTION_BACKEND", None)
136138
remote_code = False
137139
try:
138140
model_config = AutoConfig.from_pretrained(model_path, trust_remote_code=False)
@@ -541,7 +543,7 @@ def create_speech_2_txt_model(model_path, device, memory_monitor, **kwargs):
541543
else:
542544
if kwargs.get("genai", True) and is_genai_available(log_msg=True):
543545
if model_class not in [OV_MODEL_CLASSES_MAPPING[default_model_type]]:
544-
log.warning("OpenVINO GenAI based benchmarking is not available for {model_type}. Will be switched to default bencmarking")
546+
log.warning("OpenVINO GenAI based benchmarking is not available for {model_type}. Will be switched to default benchmarking")
545547
else:
546548
log.info("Selected OpenVINO GenAI for benchmarking")
547549
return create_genai_speech_2_txt_model(model_path, device, memory_monitor, **kwargs)

0 commit comments

Comments
 (0)