a40pyopencl 22-4500 (N,N)2,3,5,7,11,13float32inplaceAuto12023-11-28 20h23:06 +00h 00m 46s [ 512 tests] 0
pyvkfft-test --systematic --backend pyopencl --gpu a40 --max-nb-tests 0 --nproc 16 --ndim 2 --range 2 4500 --dst 3 --radix --inplace --norm 1 --range-mb 0 4100

ERRORS:

======================================================================
test_systematic  (backend='pyopencl', shape=(2048, 2048), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 408, in test_accuracy
    n2, ni = l2(d, d1_gpu.get()), li(d, d1_gpu.get())
                   ^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/array.py", line 921, in get
    ary, event1 = self._get(queue=queue, ary=ary, async_=async_, **kwargs)
                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/array.py", line 880, in _get
    event1 = cl.enqueue_copy(queue, ary, self.base_data,
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/__init__.py", line 2009, in enqueue_copy
    return _cl._enqueue_read_buffer(queue, src, dest, **kwargs)
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
pyopencl._cl.RuntimeError: clEnqueueReadBuffer failed: OUT_OF_RESOURCES

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 578, in test_accuracy_kwargs
    raise RuntimeError("An OpenCL RuntimeError was encountered")
RuntimeError: An OpenCL RuntimeError was encountered
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: An OpenCL RuntimeError was encountered

======================================================================
test_systematic  (backend='pyopencl', shape=(2187, 2187), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2187,2187) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2187,2187) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2250, 2250), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2250,2250) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2250,2250) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2288, 2288), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2288,2288) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2288,2288) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2366, 2366), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2366,2366) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2366,2366) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2420, 2420), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2420,2420) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2420,2420) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2464, 2464), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2464,2464) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2464,2464) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2535, 2535), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2535,2535) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2535,2535) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2574, 2574), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2574,2574) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2574,2574) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2640, 2640), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2640,2640) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2640,2640) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2695, 2695), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2695,2695) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2695,2695) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2704, 2704), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2704,2704) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2704,2704) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2750, 2750), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2750,2750) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2750,2750) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2860, 2860), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2860,2860) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2860,2860) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(2916, 2916), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2916,2916) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (2916,2916) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3024, 3024), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3024,3024) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3024,3024) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3042, 3042), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3042,3042) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3042,3042) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3087, 3087), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3087,3087) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3087,3087) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3146, 3146), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3146,3146) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3146,3146) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3200, 3200), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3200,3200) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3200,3200) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3276, 3276), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3276,3276) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3276,3276) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3380, 3380), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3380,3380) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3380,3380) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3432, 3432), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3432,3432) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3432,3432) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3465, 3465), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3465,3465) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3465,3465) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3549, 3549), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3549,3549) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3549,3549) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3640, 3640), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3640,3640) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3640,3640) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3750, 3750), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3750,3750) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3750,3750) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3773, 3773), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3773,3773) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3773,3773) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3872, 3872), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3872,3872) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3872,3872) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(3969, 3969), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3969,3969) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (3969,3969) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4000, 4000), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4000,4000) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4000,4000) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4050, 4050), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4050,4050) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4050,4050) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4096, 4096), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 408, in test_accuracy
    n2, ni = l2(d, d1_gpu.get()), li(d, d1_gpu.get())
                   ^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/array.py", line 921, in get
    ary, event1 = self._get(queue=queue, ary=ary, async_=async_, **kwargs)
                  ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/array.py", line 880, in _get
    event1 = cl.enqueue_copy(queue, ary, self.base_data,
             ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyopencl/__init__.py", line 2009, in enqueue_copy
    return _cl._enqueue_read_buffer(queue, src, dest, **kwargs)
           ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
pyopencl._cl.RuntimeError: clEnqueueReadBuffer failed: OUT_OF_RESOURCES

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 578, in test_accuracy_kwargs
    raise RuntimeError("An OpenCL RuntimeError was encountered")
RuntimeError: An OpenCL RuntimeError was encountered
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: An OpenCL RuntimeError was encountered

======================================================================
test_systematic  (backend='pyopencl', shape=(4116, 4116), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4116,4116) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4116,4116) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4200, 4200), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4200,4200) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4200,4200) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4235, 4235), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4235,4235) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4235,4235) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4368, 4368), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4368,4368) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4368,4368) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4394, 4394), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4394,4394) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4394,4394) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4400, 4400), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4400,4400) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4400,4400) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4459, 4459), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4459,4459) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4459,4459) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]

======================================================================
test_systematic  (backend='pyopencl', shape=(4480, 4480), ndim=2, dtype=dtype('float32'), norm=1, use_lut=False, inplace=True, r2c=False, dct=False, dst=3, fstride=False) [pyvkfft.test.test_fft.TestFFTSystematic]:
----------------------------------------------------------------------
multiprocessing.pool.RemoteTraceback: 
"""
Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 125, in worker
    result = (True, func(*args, **kwds))
                    ^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 573, in test_accuracy_kwargs
    t = test_accuracy(**kwargs)
        ^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/accuracy.py", line 303, in test_accuracy
    app = clVkFFTApp(d0.shape, d0.dtype, queue, ndim=ndim, norm=norm,
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/opencl.py", line 173, in __init__
    check_vkfft_result(res, shape, dtype, ndim, inplace, norm, r2c, dct, dst, axes, "opencl:%s:%s" %
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/base.py", line 420, in check_vkfft_result
    raise RuntimeError("VkFFT error %d: %s %s" % (res, r.name, s))
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4480,4480) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]
"""

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/site-packages/pyvkfft/test/test_fft.py", line 979, in test_systematic
    res = results.next(timeout=self.timeout * r)
          ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
  File "/home/esrf/favre/miniconda3/envs/pynx-py311-cu11.7/lib/python3.11/multiprocessing/pool.py", line 873, in next
    raise value
RuntimeError: VkFFT error 4031: VKFFT_ERROR_FAILED_TO_COMPILE_PROGRAM DST3 (4480,4480) float32 2D inplace norm=1 [opencl:NVIDIA CUDA:NVIDIA A40]