Hi,
I'm attempting to run
c:\PyFR-1.7.5\examples\euler_vortex_2d>mpiexec -n 2 pyfr run -b cuda -p
euler_vortex_2d.pyfrm euler_vortex_2d.ini
with the following change in the .ini file, from
device-id = round-robin
to
device-id = local-rank
.
I get
pycuda.driver.CompileError: nvcc compilation of
C:\Users\admin\AppData\Local\Temp\tmpinwerlob\kernel.cu failed
[command: nvcc --cubin -arch sm_20 -m64
-Ic:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pycuda\cuda
kernel.cu]
[stdout:
nvcc fatal : Value 'sm_20' is not defined for option 'gpu-architecture'
]
.
My understanding (from googling the error) is that sm_20 cannot be used
with CUDA 9. I don't know how (or where) to change this flag to sm_30, which
should work(?). (I've tried setting the environment variable CUDA_NVCC_FLAGS
to "-arch=sm_30", but it makes no difference. I still get "Value 'sm_20' is not
defined for option 'gpu-architecture'".)
I guess changing from sm_20 to sm_30 (or something) is what I want to do?
Can anyone help me with how to do that?
Running on Windows 10, CUDA 9.1 with a GTX 1080 Ti (and a GTX 470).
I'm attaching the complete output I get from running the program.
Best regards,
Magnus
--
You received this message because you are subscribed to the Google Groups "PyFR
Mailing List" group.
To unsubscribe from this group and stop receiving emails from it, send an email
to [email protected].
To post to this group, send an email to [email protected].
Visit this group at https://groups.google.com/group/pyfrmailinglist.
For more options, visit https://groups.google.com/d/optout.
c:\PyFR-1.7.5\examples\euler_vortex_2d>mpiexec -n 2 pyfr run -b cuda -p
euler_vortex_2d.pyfrm euler_vortex_2d.ini
c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\h5py\__init__.py:36:
FutureWarning: Conversion of the second argument of issubdtype from `float` to
`np.floating` is deprecated. In future, it will be treated as `np.float64 ==
np.dtype(float).type`.
from ._conv import register_converters as _register_converters
Traceback (most recent call last):
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\util.py",
line 33, in __call__
res = cache[key]
KeyError: (<function CUDAKernelProvider._build_kernel at 0x000001ECE5C18AE8>,
b'\x80\x03X\t\x00\x00\x00gimmik_mmq\x00X,\x0c\x00\x00\n__global__
void\ngimmik_mm(int n,\n const double* __restrict__ b, int ldb,\n
double* __restrict__ c, int ldc)\n{\n int i = blockDim.x*blockIdx.x +
threadIdx.x;\n double dotp;\n\n if (i < n)\n {\n dotp =
1.5267881254572668*b[i + 0*ldb] + -0.8136324494869274*b[i + 4*ldb] +
0.4007615203116505*b[i + 8*ldb] + -0.11391719628199*b[i + 12*ldb];\n c[i
+ 0*ldc] = dotp;\n dotp = 1.5267881254572668*b[i + 1*ldb] +
-0.8136324494869274*b[i + 5*ldb] + 0.4007615203116505*b[i + 9*ldb] +
-0.11391719628199*b[i + 13*ldb];\n c[i + 1*ldc] = dotp;\n dotp =
1.5267881254572668*b[i + 2*ldb] + -0.8136324494869274*b[i + 6*ldb] +
0.4007615203116505*b[i + 10*ldb] + -0.11391719628199*b[i + 14*ldb];\n
c[i + 2*ldc] = dotp;\n dotp = 1.5267881254572668*b[i + 3*ldb] +
-0.8136324494869274*b[i + 7*ldb] + 0.4007615203116505*b[i + 11*ldb] +
-0.11391719628199*b[i + 15*ldb];\n c[i + 3*ldc] = dotp;\n dotp =
-0.11391719628199*b[i + 0*ldb] + 0.4007615203116505*b[i + 1*ldb] +
-0.8136324494869274*b[i + 2*ldb] + 1.5267881254572668*b[i + 3*ldb];\n
c[i + 4*ldc] = dotp;\n dotp = -0.11391719628199*b[i + 4*ldb] +
0.4007615203116505*b[i + 5*ldb] + -0.8136324494869274*b[i + 6*ldb] +
1.5267881254572668*b[i + 7*ldb];\n c[i + 5*ldc] = dotp;\n dotp =
-0.11391719628199*b[i + 8*ldb] + 0.4007615203116505*b[i + 9*ldb] +
-0.8136324494869274*b[i + 10*ldb] + 1.5267881254572668*b[i + 11*ldb];\n
c[i + 6*ldc] = dotp;\n dotp = -0.11391719628199*b[i + 12*ldb] +
0.4007615203116505*b[i + 13*ldb] + -0.8136324494869274*b[i + 14*ldb] +
1.5267881254572668*b[i + 15*ldb];\n c[i + 7*ldc] = dotp;\n dotp =
-0.11391719628199*b[i + 0*ldb] + 0.4007615203116505*b[i + 4*ldb] +
-0.8136324494869274*b[i + 8*ldb] + 1.5267881254572668*b[i + 12*ldb];\n
c[i + 8*ldc] = dotp;\n dotp = -0.11391719628199*b[i + 1*ldb] +
0.4007615203116505*b[i + 5*ldb] + -0.8136324494869274*b[i + 9*ldb] +
1.5267881254572668*b[i + 13*ldb];\n c[i + 9*ldc] = dotp;\n dotp =
-0.11391719628199*b[i + 2*ldb] + 0.4007615203116505*b[i + 6*ldb] +
-0.8136324494869274*b[i + 10*ldb] + 1.5267881254572668*b[i + 14*ldb];\n
c[i + 10*ldc] = dotp;\n dotp = -0.11391719628199*b[i + 3*ldb] +
0.4007615203116505*b[i + 7*ldb] + -0.8136324494869274*b[i + 11*ldb] +
1.5267881254572668*b[i + 15*ldb];\n c[i + 11*ldc] = dotp;\n dotp
= 1.5267881254572668*b[i + 0*ldb] + -0.8136324494869274*b[i + 1*ldb] +
0.4007615203116505*b[i + 2*ldb] + -0.11391719628199*b[i + 3*ldb];\n c[i
+ 12*ldc] = dotp;\n dotp = 1.5267881254572668*b[i + 4*ldb] +
-0.8136324494869274*b[i + 5*ldb] + 0.4007615203116505*b[i + 6*ldb] +
-0.11391719628199*b[i + 7*ldb];\n c[i + 13*ldc] = dotp;\n dotp =
1.5267881254572668*b[i + 8*ldb] + -0.8136324494869274*b[i + 9*ldb] +
0.4007615203116505*b[i + 10*ldb] + -0.11391719628199*b[i + 11*ldb];\n
c[i + 14*ldc] = dotp;\n dotp = 1.5267881254572668*b[i + 12*ldb] +
-0.8136324494869274*b[i + 13*ldb] + 0.4007615203116505*b[i + 14*ldb] +
-0.11391719628199*b[i + 15*ldb];\n c[i + 15*ldc] = dotp;\n
}\n}\nq\x01X\x05\x00\x00\x00iPiPiq\x02\x87q\x03.', b'\x80\x03}q\x00.')
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "c:\users\admin\appdata\local\programs\python\python36\lib\runpy.py",
line 193, in _run_module_as_main
"__main__", mod_spec)
File "c:\users\admin\appdata\local\programs\python\python36\lib\runpy.py",
line 85, in _run_code
exec(code, run_globals)
File
"C:\Users\admin\AppData\Local\Programs\Python\Python36\Scripts\pyfr.exe\__main__.py",
line 9, in <module>
mpi4py.rc.initialize = False
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\__main__.py",
line 110, in main
args.process(args)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\__main__.py",
line 235, in process_run
args, NativeReader(args.mesh), None, Inifile.load(args.cfg)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\__main__.py",
line 216, in _process_common
solver = get_solver(backend, rallocs, mesh, soln, cfg)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\solvers\__init__.py",
line 16, in get_solver
return get_integrator(backend, systemcls, rallocs, mesh, initsoln, cfg)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\__init__.py",
line 46, in get_integrator
return integrator(backend, systemcls, rallocs, mesh, initsoln, cfg)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\std\controllers.py",
line 14, in __init__
super().__init__(*args, **kwargs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\std\steppers.py",
line 8, in __init__
super().__init__(*args, **kwargs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\std\base.py",
line 10, in __init__
super().__init__(*args, **kwargs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\base.py",
line 58, in __init__
self._init_system(systemcls, backend, rallocs, mesh, initsoln)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\integrators\base.py",
line 88, in _init_system
self.system = systemcls(*args, nreg=self.nreg, cfg=self.cfg)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\solvers\base\system.py",
line 65, in __init__
self._gen_kernels(eles, int_inters, mpi_inters, bc_inters)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\solvers\base\system.py",
line 174, in _gen_kernels
kernels[pn, kn].append(kgetter())
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\solvers\baseadvec\elements.py",
line 57, in <lambda>
out=self._scal_fpts
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\backends\base\backend.py",
line 166, in kernel
return kern(*args, **kwargs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\backends\cuda\gimmik.py",
line 36, in mul
fun = self._build_kernel('gimmik_mm', src, 'iPiPi')
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\util.py",
line 35, in __call__
res = cache[key] = self.func(*args, **kwargs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pyfr\backends\cuda\provider.py",
line 20, in _build_kernel
fun = compiler.SourceModule(src).get_function(name)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pycuda\compiler.py",
line 291, in __init__
arch, code, cache_dir, include_dirs)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pycuda\compiler.py",
line 255, in compile
return compile_plain(source, options, keep, nvcc, cache_dir, target)
File
"c:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pycuda\compiler.py",
line 137, in compile_plain
stderr=stderr.decode("utf-8", "replace"))
pycuda.driver.CompileError: nvcc compilation of
C:\Users\admin\AppData\Local\Temp\tmpinwerlob\kernel.cu failed
[command: nvcc --cubin -arch sm_20 -m64
-Ic:\users\admin\appdata\local\programs\python\python36\lib\site-packages\pycuda\cuda
kernel.cu]
[stdout:
nvcc fatal : Value 'sm_20' is not defined for option 'gpu-architecture'
]
job aborted:
[ranks] message
[0] terminated
[1] application aborted
aborting MPI_COMM_WORLD (comm=0x44000000), error 1, comm rank 1
---- error analysis -----
[1] on BEAST
pyfr aborted the job. abort code 1
---- error analysis -----