[GPU] Relax batch size limitations for DO GPU implementation usage for some of Gen12HP dGPUs (#8801)

This commit is contained in:
Sergey Shlyapnikov
2021-11-29 05:41:39 +03:00
committed by GitHub
parent a09f4ded79
commit 497aaf9b46

View File

@@ -1164,7 +1164,9 @@ impl_types layout_optimizer::get_preferred_impl_type(program_node& node, format
auto& detection_output_node = node.as<detection_output>();
auto confidence_layout = detection_output_node.confidence().get_output_layout();
auto prim = detection_output_node.get_primitive();
if (confidence_layout.size.batch[0] <= lws_max && confidence_layout.size.batch[0] >= 4 && prim->confidence_threshold >= 0.1 &&
auto batch_size_limitations = (device_info.supports_immad && device_info.execution_units_count >= 256) ? true : confidence_layout.size.batch[0] >= 4;
if (confidence_layout.size.batch[0] <= lws_max && batch_size_limitations &&
prim->confidence_threshold >= 0.1 &&
prim->top_k <= 400 && prim->num_classes >= 16 && confidence_layout.size.feature[0] > 10000)
preferred_impl = impl_types::ocl;
else