File tree Expand file tree Collapse file tree 1 file changed +1
-1
lines changed
src/plugins/intel_gpu/src/graph/impls/ocl_v2/sdpa Expand file tree Collapse file tree 1 file changed +1
-1
lines changed Original file line number Diff line number Diff line change @@ -123,7 +123,7 @@ class SDPAOptImpl : public SDPAImplBase {
123
123
// So far this case has been observed only in non-LM models, such as vision embedding models.
124
124
// If we need to optimize unaligned-head-size SDPA for the 2nd+ token phase of an LM model,
125
125
// we'll need to fix the single_token kernel to support unaligned head sizes.
126
- if (is_prefill || unaligned_head_size (params )) {
126
+ if (is_prefill || unaligned_head_size (new_params )) {
127
127
GPU_DEBUG_TRACE_DETAIL << " execute multi_tokens for prefill with indirect = " << is_indirect << " \n " ;
128
128
return execute_stage (events, instance, is_indirect ? indirect_multi_tokens : regular_multi_tokens);
129
129
}
You can’t perform that action at this time.
0 commit comments