improved autotune engine

[hashcat.git] / src / oclHashcat.c
diff --git a/src/oclHashcat.c b/src/oclHashcat.c

index 1c8634e..035a97d 100644 (file)
--- a/src/oclHashcat.c
+++ b/src/oclHashcat.c
@@ -3018,6 +3018,20 @@ static void autotune (hc_device_param_t *device_param)
      }
    }
  
+  // because of the balance we may have some free space left!
+  // at this point, allow a small variance to overdrive the limit
+
+  const int exec_left = (target_ms * 1.2) / exec_best;
+
+  const int accel_left = kernel_accel_max / kernel_accel_best;
+
+  const int exec_accel_min = MIN (exec_left, accel_left);
+
+  if (exec_accel_min)
+  {
+    kernel_accel_best *= exec_accel_min;
+  }
+
    // reset timer
  
    device_param->exec_pos = 0;
@@ -5323,6 +5337,9 @@ int main (int argc, char **argv)
    if (getenv ("CUDA_CACHE_DISABLE") == NULL)
      putenv ((char *) "CUDA_CACHE_DISABLE=1");
  
+  if (getenv ("POCL_KERNEL_CACHE") == NULL)
+    putenv ((char *) "POCL_KERNEL_CACHE=0");
+
    /**
     * Real init
     */
@@ -13940,7 +13957,7 @@ int main (int argc, char **argv)
  
        // we don't have sm_* on vendors not NV but it doesn't matter
  
-      snprintf (build_opts, sizeof (build_opts) - 1, "-I\"%s/\" -DVENDOR_ID=%u -DCUDA_ARCH=%d -DVECT_SIZE=%u -DDEVICE_TYPE=%u", shared_dir, device_param->vendor_id, (device_param->sm_major * 100) + device_param->sm_minor, device_param->vector_width, (u32) device_param->device_type);
+      snprintf (build_opts, sizeof (build_opts) - 1, "-cl-std=CL1.1 -I\"%s/\" -DVENDOR_ID=%u -DCUDA_ARCH=%d -DVECT_SIZE=%u -DDEVICE_TYPE=%u", shared_dir, device_param->vendor_id, (device_param->sm_major * 100) + device_param->sm_minor, device_param->vector_width, (u32) device_param->device_type);
  
        /**
         * main kernel