Reduce max kernel threads from 256 to 64 in -w 4 to save host and GPU memory

2025-04-05 01:06:00 +00:00 · 2018-02-06 09:38:54 +01:00 · 2018-02-06 09:38:54 +01:00 · cdc4f3828b
commit cdc4f3828b
parent 5391edca0d
1 changed files with 3 additions and 2 deletions
--- a/src/interface.c
+++ b/src/interface.c
@ -26023,9 +26023,10 @@ u32 hashconfig_get_kernel_threads (hashcat_ctx_t *hashcat_ctx, const hc_device_p
  // kernel_accel_max to be a very low number because the pws buffer will be so large otherwise.
  // therefore autotune will be unable to calculate a good kernel_accel multiplier.
  // currently there's no OpenCL device known that needs result in a better performance with 1024 threads compared to 256.
-  // as a result, we limit the number of threads to 256, which turns out to be a general good value.
+  // as a result, we limit the number of threads to 64, which turns out to be a general good value.
+  // there's a 1.00% - 2.75% performance drop at NV caused by this, and 0.00% - 1.02% at AMD.

-  kernel_threads = MIN (kernel_threads, 256);
+  kernel_threads = MIN (kernel_threads, 64);

  return kernel_threads;
 }