|
|
|
@ -64,6 +64,12 @@ char *module_jit_build_options (MAYBE_UNUSED const hashconfig_t *hashconfig, MAY
|
|
|
|
|
}
|
|
|
|
|
else if (device_param->opencl_device_type & CL_DEVICE_TYPE_GPU)
|
|
|
|
|
{
|
|
|
|
|
#if defined (__APPLE__)
|
|
|
|
|
|
|
|
|
|
native_threads = 32;
|
|
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
|
|
|
|
|
if (device_param->device_local_mem_size < 49152)
|
|
|
|
|
{
|
|
|
|
|
native_threads = MIN (device_param->kernel_preferred_wgs_multiple, 32); // We can't just set 32, because Intel GPU need 8
|
|
|
|
@ -72,6 +78,8 @@ char *module_jit_build_options (MAYBE_UNUSED const hashconfig_t *hashconfig, MAY
|
|
|
|
|
{
|
|
|
|
|
native_threads = device_param->kernel_preferred_wgs_multiple;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
hc_asprintf (&jit_build_options, "-D FIXED_LOCAL_SIZE=%u -D _unroll", native_threads);
|
|
|
|
|