Skip to content

Commit 0047931

Browse files
authored
[llm bench] Turn off PA backend for VLM (#2312)
1 parent da7a5a5 commit 0047931

File tree

1 file changed

+7 -3 lines changed

1 file changed

+7 -3 lines changed

tools/llm_bench/llm_bench_utils/model_utils.py

Lines changed: 7 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,8 @@
1010
USE_CASES,
1111
OV_MODEL_CLASSES_MAPPING,
1212
PT_MODEL_CLASSES_MAPPING,
13-
PA_ATTENTION_BACKEND
13+
PA_ATTENTION_BACKEND,
14+
SDPA_ATTENTION_BACKEND
1415
)
1516
import librosa
1617

@@ -183,8 +184,11 @@ def analyze_args(args):
183184
model_args['config'] = config
184185
if model_framework == 'ov':
185186
set_default_param_for_ov_config(model_args['config'])
186-
if 'ATTENTION_BACKEND' not in model_args['config'] and use_case in ['text_gen', 'vlm'] and args.device != "NPU" and not optimum:
187-
model_args['config']['ATTENTION_BACKEND'] = PA_ATTENTION_BACKEND
187+
if 'ATTENTION_BACKEND' not in model_args['config'] and not optimum:
188+
if use_case in ['text_gen'] and args.device != "NPU":
189+
model_args['config']['ATTENTION_BACKEND'] = PA_ATTENTION_BACKEND
190+
elif use_case in ['vlm']:
191+
model_args['config']['ATTENTION_BACKEND'] = SDPA_ATTENTION_BACKEND
188192
log.info(f"OV Config={model_args['config']}")
189193
elif model_framework == 'pt':
190194
log.info(f"PT Config={model_args['config']}")

0 commit comments

Comments (0)