[GPU] Skip FC fake alignment for some vector by matrix multiplications (#17051)
This commit is contained in:
parent
eac265722f
commit
e8ae1e41ea
@ -176,9 +176,15 @@ kernel_impl_params fully_connected_inst::get_fake_aligned_params(kernel_impl_par
|
||||
auto updated_param = orig_impl_param;
|
||||
auto input_shape = orig_input_layout.get_partial_shape().to_shape();
|
||||
auto input_row_idx = input_shape.size() - 2;
|
||||
input_shape[input_row_idx] = align_to(input_shape[input_row_idx], 8);
|
||||
auto output_shape = orig_output_layout.get_partial_shape().to_shape();
|
||||
auto output_row_idx = output_shape.size() - 2;
|
||||
|
||||
// Vector-by-matrix multiplication can run slower with fake alignment, so skip the alignment in that case
|
||||
if (input_shape[input_row_idx] == 1 && output_shape[output_row_idx] == 1 && input_shape[input_shape.size() - 1] >= 1024) {
|
||||
return std::move(orig_impl_param);
|
||||
}
|
||||
|
||||
input_shape[input_row_idx] = align_to(input_shape[input_row_idx], 8);
|
||||
output_shape[output_row_idx] = align_to(output_shape[output_row_idx], 8);
|
||||
|
||||
updated_param.input_layouts[0] = layout(ov::PartialShape(input_shape),
|
||||
|
Loading…
Reference in New Issue
Block a user