add workaround for failing overhead estimation test on (Intel) GPUs that only support single precision

2023-07-18 13:24:11 -04:00
parent 34fcf1361f
commit 021eeae860
1 changed files with 8 additions and 1 deletions
--- a/lib/gpu/lal_device.cpp
+++ b/lib/gpu/lal_device.cpp
@ -745,7 +745,14 @@ void DeviceT::estimate_gpu_overhead(const int kernel_calls,
  gpu_overhead=0.0;
  gpu_driver_overhead=0.0;
-  for (int z=0; z<11; z++) {
+  // TODO: XXX
  // The following estimation currently fails with OpenCL error code -5
  // (CL_OUT_OF_RESOURCES) on Intel GPUs that do not support double precision.
  // Until we have a better solution, we just skip this test in this case.
  int zloops = 11;
  if (!gpu->double_precision()) zloops = 0;
  for (int z=0; z < zloops; z++) {
    gpu->sync();
    gpu_barrier();
    over_timer.start();