hm_device_val_to_str ((char *) utilization, HM_STR_BUF_SIZE, "%", hm_get_utilization_with_device_id (device_id));
hm_device_val_to_str ((char *) temperature, HM_STR_BUF_SIZE, "c", hm_get_temperature_with_device_id (device_id));
- if (device_param->vendor_id == VENDOR_ID_AMD)
+ if (device_param->device_vendor_id == VENDOR_ID_AMD)
{
hm_device_val_to_str ((char *) fanspeed, HM_STR_BUF_SIZE, "%", hm_get_fanspeed_with_device_id (device_id));
}
- else if (device_param->vendor_id == VENDOR_ID_NV)
+ else if (device_param->device_vendor_id == VENDOR_ID_NV)
{
hm_device_val_to_str ((char *) fanspeed, HM_STR_BUF_SIZE, "%", hm_get_fanspeed_with_device_id (device_id));
}
{
int rc = -1;
- if (device_param->opencl_v12 && device_param->vendor_id == VENDOR_ID_AMD)
+ if (device_param->opencl_v12 && device_param->platform_vendor_id == VENDOR_ID_AMD)
{
// So far tested, amd is the only supporting this OpenCL 1.2 function without segfaulting
exec_ms_pre_final = MIN (exec_ms_pre_final, exec_ms_pre_final_v);
}
+ u32 diff = kernel_loops - kernel_accel;
+
if ((kernel_loops_min < kernel_loops_max) && (kernel_accel_min < kernel_accel_max))
{
- for (u32 f = 2; f < 1024; f++)
+ u32 kernel_accel_orig = kernel_accel;
+ u32 kernel_loops_orig = kernel_loops;
+
+ for (u32 f = 1; f < 1024; f++)
{
- const u32 kernel_accel_try = kernel_accel * f;
- const u32 kernel_loops_try = kernel_loops / f;
+ const u32 kernel_accel_try = (float) kernel_accel_orig * f;
+ const u32 kernel_loops_try = (float) kernel_loops_orig / f;
if (kernel_accel_try > kernel_accel_max) break;
if (kernel_loops_try < kernel_loops_min) break;
+ u32 diff_new = kernel_loops_try - kernel_accel_try;
+
+ if (diff_new > diff) break;
+
+ diff_new = diff;
+
double exec_ms = try_run (device_param, kernel_accel_try, kernel_loops_try);
for (int i = 0; i < VERIFIER_CNT; i++)
// this causes trouble with vendor id based macros
// we'll assign generic to those without special optimization available
- cl_uint vendor_id = 0;
+ cl_uint platform_vendor_id = 0;
if (strcmp (platform_vendor, CL_VENDOR_AMD) == 0)
{
- vendor_id = VENDOR_ID_AMD;
+ platform_vendor_id = VENDOR_ID_AMD;
+ }
+ else if (strcmp (platform_vendor, CL_VENDOR_AMD_USE_INTEL) == 0)
+ {
+ platform_vendor_id = VENDOR_ID_AMD_USE_INTEL;
}
else if (strcmp (platform_vendor, CL_VENDOR_APPLE) == 0)
{
- vendor_id = VENDOR_ID_APPLE;
+ platform_vendor_id = VENDOR_ID_APPLE;
}
else if (strcmp (platform_vendor, CL_VENDOR_INTEL_BEIGNET) == 0)
{
- vendor_id = VENDOR_ID_INTEL_BEIGNET;
+ platform_vendor_id = VENDOR_ID_INTEL_BEIGNET;
}
else if (strcmp (platform_vendor, CL_VENDOR_INTEL_SDK) == 0)
{
- vendor_id = VENDOR_ID_INTEL_SDK;
+ platform_vendor_id = VENDOR_ID_INTEL_SDK;
}
else if (strcmp (platform_vendor, CL_VENDOR_MESA) == 0)
{
- vendor_id = VENDOR_ID_MESA;
+ platform_vendor_id = VENDOR_ID_MESA;
}
else if (strcmp (platform_vendor, CL_VENDOR_NV) == 0)
{
- vendor_id = VENDOR_ID_NV;
+ platform_vendor_id = VENDOR_ID_NV;
}
else if (strcmp (platform_vendor, CL_VENDOR_POCL) == 0)
{
- vendor_id = VENDOR_ID_POCL;
+ platform_vendor_id = VENDOR_ID_POCL;
}
else
{
- vendor_id = VENDOR_ID_GENERIC;
+ platform_vendor_id = VENDOR_ID_GENERIC;
}
for (uint platform_devices_id = 0; platform_devices_id < platform_devices_cnt; platform_devices_id++)
hc_device_param_t *device_param = &data.devices_param[device_id];
- device_param->vendor_id = vendor_id;
+ device_param->platform_vendor_id = platform_vendor_id;
device_param->device = platform_devices[platform_devices_id];
device_param->device_name = device_name;
+ // device_vendor
+
+ hc_clGetDeviceInfo (data.ocl, device_param->device, CL_DEVICE_VENDOR, 0, NULL, &param_value_size);
+
+ char *device_vendor = (char *) mymalloc (param_value_size);
+
+ hc_clGetDeviceInfo (data.ocl, device_param->device, CL_DEVICE_VENDOR, param_value_size, device_vendor, NULL);
+
+ device_param->device_vendor = device_vendor;
+
+ cl_uint device_vendor_id = 0;
+
+ if (strcmp (device_vendor, CL_VENDOR_AMD) == 0)
+ {
+ device_vendor_id = VENDOR_ID_AMD;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_AMD_USE_INTEL) == 0)
+ {
+ device_vendor_id = VENDOR_ID_AMD_USE_INTEL;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_APPLE) == 0)
+ {
+ device_vendor_id = VENDOR_ID_APPLE;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_INTEL_BEIGNET) == 0)
+ {
+ device_vendor_id = VENDOR_ID_INTEL_BEIGNET;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_INTEL_SDK) == 0)
+ {
+ device_vendor_id = VENDOR_ID_INTEL_SDK;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_MESA) == 0)
+ {
+ device_vendor_id = VENDOR_ID_MESA;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_NV) == 0)
+ {
+ device_vendor_id = VENDOR_ID_NV;
+ }
+ else if (strcmp (device_vendor, CL_VENDOR_POCL) == 0)
+ {
+ device_vendor_id = VENDOR_ID_POCL;
+ }
+ else
+ {
+ device_vendor_id = VENDOR_ID_GENERIC;
+ }
+
+ device_param->device_vendor_id = device_vendor_id;
+
// tuning db
tuning_db_entry_t *tuningdb_entry = tuning_db_search (tuning_db, device_param, attack_mode, hash_mode);
if (device_endian_little == CL_FALSE)
{
- log_info ("Device #%u: WARNING: not little endian device", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: not little endian device", device_id + 1);
device_param->skipped = 1;
}
if (device_available == CL_FALSE)
{
- log_info ("Device #%u: WARNING: device not available", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device not available", device_id + 1);
device_param->skipped = 1;
}
if (device_compiler_available == CL_FALSE)
{
- log_info ("Device #%u: WARNING: device no compiler available", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device no compiler available", device_id + 1);
device_param->skipped = 1;
}
if ((device_execution_capabilities & CL_EXEC_KERNEL) == 0)
{
- log_info ("Device #%u: WARNING: device does not support executing kernels", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device does not support executing kernels", device_id + 1);
device_param->skipped = 1;
}
if (strstr (device_extensions, "base_atomics") == 0)
{
- log_info ("Device #%u: WARNING: device does not support base atomics", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device does not support base atomics", device_id + 1);
device_param->skipped = 1;
}
if (strstr (device_extensions, "byte_addressable_store") == 0)
{
- log_info ("Device #%u: WARNING: device does not support byte addressable store", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device does not support byte addressable store", device_id + 1);
device_param->skipped = 1;
}
if (device_local_mem_size < 32768)
{
- log_info ("Device #%u: WARNING: device local mem size is too small", device_id + 1);
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: device local mem size is too small", device_id + 1);
device_param->skipped = 1;
}
+ // If there's both an Intel CPU and an AMD OpenCL runtime it's a tricky situation
+ // Both platforms support CPU device types and therefore both will try to use 100% of the physical resources
+ // This results in both utilizing it for 50%
+ // However, Intel has much better SIMD control over their own hardware
+ // It makes sense to give them full control over their own hardware
+
+ if (device_type & CL_DEVICE_TYPE_CPU)
+ {
+ if (device_param->device_vendor_id == VENDOR_ID_AMD_USE_INTEL)
+ {
+ if (data.quiet == 0) log_info ("Device #%u: WARNING: not native intel opencl platform", device_id + 1);
+
+ device_param->skipped = 1;
+ }
+ }
// skipped
char *device_name_chksum = (char *) mymalloc (INFOSZ);
#if __x86_64__
- snprintf (device_name_chksum, INFOSZ - 1, "%u-%u-%u-%s-%s-%s-%u", 64, device_param->vendor_id, device_param->vector_width, device_param->device_name, device_param->device_version, device_param->driver_version, COMPTIME);
+ snprintf (device_name_chksum, INFOSZ - 1, "%u-%u-%u-%s-%s-%s-%u", 64, device_param->platform_vendor_id, device_param->vector_width, device_param->device_name, device_param->device_version, device_param->driver_version, COMPTIME);
#else
- snprintf (device_name_chksum, INFOSZ - 1, "%u-%u-%u-%s-%s-%s-%u", 32, device_param->vendor_id, device_param->vector_width, device_param->device_name, device_param->device_version, device_param->driver_version, COMPTIME);
+ snprintf (device_name_chksum, INFOSZ - 1, "%u-%u-%u-%s-%s-%s-%u", 32, device_param->platform_vendor_id, device_param->vector_width, device_param->device_name, device_param->device_version, device_param->driver_version, COMPTIME);
#endif
uint device_name_digest[4] = { 0 };
if (device_type & CL_DEVICE_TYPE_GPU)
{
- if (vendor_id == VENDOR_ID_AMD)
+ if (device_vendor_id == VENDOR_ID_AMD)
{
cl_uint device_processor_cores = 0;
device_param->device_processor_cores = device_processor_cores;
}
- else if (vendor_id == VENDOR_ID_NV)
+ else if (device_vendor_id == VENDOR_ID_NV)
{
cl_uint kernel_exec_timeout = 0;
{
if (device_type & CL_DEVICE_TYPE_GPU)
{
- if (vendor_id == VENDOR_ID_AMD)
+ if (platform_vendor_id == VENDOR_ID_AMD)
{
int catalyst_check = (force == 1) ? 0 : 1;
return (-1);
}
}
- else if (vendor_id == VENDOR_ID_NV)
+ else if (platform_vendor_id == VENDOR_ID_NV)
{
if (device_param->kernel_exec_timeout != 0)
{
/* turns out pocl still creates segfaults (because of llvm)
if (device_type & CL_DEVICE_TYPE_CPU)
{
- if (vendor_id == VENDOR_ID_AMD)
+ if (platform_vendor_id == VENDOR_ID_AMD)
{
if (force == 0)
{
const uint platform_devices_id = device_param->platform_devices_id;
#if defined(HAVE_NVML) || defined(HAVE_NVAPI)
- if (device_param->vendor_id == VENDOR_ID_NV)
+ if (device_param->device_vendor_id == VENDOR_ID_NV)
{
memcpy (&data.hm_device[device_id], &hm_adapters_nv[platform_devices_id], sizeof (hm_attrs_t));
}
#endif
#ifdef HAVE_ADL
- if (device_param->vendor_id == VENDOR_ID_AMD)
+ if (device_param->device_vendor_id == VENDOR_ID_AMD)
{
memcpy (&data.hm_device[device_id], &hm_adapters_amd[platform_devices_id], sizeof (hm_attrs_t));
}
if (hash_mode == 8900)
{
- if (device_param->vendor_id == VENDOR_ID_AMD)
+ if (device_param->device_vendor_id == VENDOR_ID_AMD)
{
tmto_start = 1;
}
- else if (device_param->vendor_id == VENDOR_ID_NV)
+ else if (device_param->device_vendor_id == VENDOR_ID_NV)
{
tmto_start = 2;
}
}
else if (hash_mode == 9300)
{
- if (device_param->vendor_id == VENDOR_ID_AMD)
+ if (device_param->device_vendor_id == VENDOR_ID_AMD)
{
tmto_start = 2;
}
- else if (device_param->vendor_id == VENDOR_ID_NV)
+ else if (device_param->device_vendor_id == VENDOR_ID_NV)
{
tmto_start = 2;
}
char build_opts_new[1024] = { 0 };
- snprintf (build_opts_new, sizeof (build_opts_new) - 1, "%s -DVENDOR_ID=%u -DCUDA_ARCH=%d -DVECT_SIZE=%u -DDEVICE_TYPE=%u -DKERN_TYPE=%u -D_unroll -cl-std=CL1.1", build_opts, device_param->vendor_id, (device_param->sm_major * 100) + device_param->sm_minor, device_param->vector_width, (u32) device_param->device_type, kern_type);
+ snprintf (build_opts_new, sizeof (build_opts_new) - 1, "%s -DVENDOR_ID=%u -DCUDA_ARCH=%d -DVECT_SIZE=%u -DDEVICE_TYPE=%u -DKERN_TYPE=%u -D_unroll -cl-std=CL1.1", build_opts, device_param->device_vendor_id, (device_param->sm_major * 100) + device_param->sm_minor, device_param->vector_width, (u32) device_param->device_type, kern_type);
strncpy (build_opts, build_opts_new, sizeof (build_opts) - 1);
-
- if (device_param->vendor_id == VENDOR_ID_INTEL_SDK)
+ /*
+ if (device_param->device_vendor_id == VENDOR_ID_INTEL_SDK)
{
// we do vectorizing much better than the auto-vectorizer
strncpy (build_opts, build_opts_new, sizeof (build_opts) - 1);
}
+ */
#ifdef DEBUG
log_info ("Device #%u: build_opts '%s'\n", device_id + 1, build_opts);