Floating point error with MPS Simulator during contract_decompose function call #147
-
Please refer to the end of the discussion in this link (#109 (reply in thread)). Regarding the latest request, @yangcal: Perlmutter has NVIDIA A100 GPUs. As for the script, the code executes without an error. |
Beta Was this translation helpful? Give feedback.
Replies: 3 comments 14 replies
-
Thanks for sharing your finding, which seems to be a very tricky case. Can you run the entire notebook with environment variable And one more question, is your installation of cuquantum-python based on pip, conda or our appliance container? |
Beta Was this translation helpful? Give feedback.
-
Sorry about the confusion. As the file is too big, here is the OneDrive link (from my school account) to the core dump file. |
Beta Was this translation helpful? Give feedback.
-
Here is the output from backtrace. #0 0x00007fca25c4ba17 in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcublas.so.12
#1 0x00007fca25d4d447 in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcublas.so.12
#2 0x00007fca25d4deb4 in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcublas.so.12
#3 0x00007fca25afe459 in cublasDdot_v2 () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcublas.so.12
#4 0x00007fca61142b62 in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcutensornet.so.2
#5 0x00007fca611289fa in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcutensornet.so.2
#6 0x00007fca6115d26d in ?? () from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcutensornet.so.2
#7 0x00007fca611615c5 in cutensornetGateSplit ()
from /global/homes/s/sgkim/.conda/envs/Tatis/lib/libcutensornet.so.2
#8 0x00007fcbf31c3cb8 in __pyx_f_9cuquantum_11cutensornet_9_internal_11cutensornet__cutensornetGateSplit(void*, void*, void const*, void*, void const*, void*, void const*, void*, void*, void*, void*, void*, cutensornetGateSplitAlgo_t, void*, cutensornetComputeType_t, void*, void*, CUstream_st*) ()
from /pscratch/sd/s/sgkim/skim_cuquantum/cuQuantum-24.03.0/python/cuquantum/cutensornet/_internal/cutensornet.cpython-39-x86_64-linux-gnu.so
#9 0x00007fcbf31e7f6c in __pyx_f_9cuquantum_11cutensornet_13cycutensornet_cutensornetGateSplit(void*, void*, void const*, void*, void const*, void*, void const*, void*, void*, void*, void*, void*, cutensornetGateSplitAlgo_t, void*, cutensornetComputeType_t, void*, void*, CUstream_st*) ()
from /pscratch/sd/s/sgkim/skim_cuquantum/cuQuantum-24.03.0/python/cuquantum/cutensornet/cycutensornet.cpython-39-x86_64-linux-gnu.so
#10 0x00007fcbf321f67a in __pyx_f_9cuquantum_11cutensornet_11cutensornet_gate_split(long, long, long, long, long, long, long, long, long, long, long, long, int, long, int, long, long, long, int) ()
from /pscratch/sd/s/sgkim/skim_cuquantum/cuQuantum-24.03.0/python/cuquantum/cutensornet/cutensornet.cpython-39-x86_64-linux-gnu.so
#11 0x00007fcbf323047b in __pyx_pw_9cuquantum_11cutensornet_11cutensornet_109gate_split(_object*, _object*, _object*) ()
from /pscratch/sd/s/sgkim/skim_cuquantum/cuQuantum-24.03.0/python/cuquantum/cutensornet/cutensornet.cpython-39-x86_64-linux-gnu.so
#12 0x00005602e486a6b6 in cfunction_call (func=0x7fcbf337a4f0, args=<optimized out>, kwargs=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Objects/methodobject.c:543
#13 0x00005602e48537ac in _PyObject_MakeTpCall (tstate=0x5602e4acc8b0, callable=0x7fcbf337a4f0,
args=<optimized out>, nargs=<optimized out>, keywords=0x0)
at /usr/local/src/conda/python-3.9.19/Objects/call.c:191
#14 0x00005602e484ff10 in _PyObject_VectorcallTstate (kwnames=0x0, nargsf=<optimized out>, args=<optimized out>,
callable=0x7fcbf337a4f0, tstate=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:116
#15 _PyObject_VectorcallTstate (kwnames=0x0, nargsf=<optimized out>, args=0x5602f64fa3e8,
callable=0x7fcbf337a4f0, tstate=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:103
#16 PyObject_Vectorcall (kwnames=0x0, nargsf=<optimized out>, args=0x5602f64fa3e8, callable=0x7fcbf337a4f0)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:127
#17 call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:5077
#18 _PyEval_EvalFrameDefault (tstate=<optimized out>, f=0x5602f64fa130, throwflag=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:3489
#19 0x00005602e484a184 in _PyEval_EvalFrame (throwflag=0, f=0x5602f64fa130, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/internal/pycore_ceval.h:40
#20 _PyEval_EvalCode (tstate=0x5602e4acc8b0, _co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=0x0, kwargs=0x5602e81f9398,
kwcount=0, kwstep=1, defs=0x0, defcount=<optimized out>, kwdefs=0x0, closure=0x0, name=0x7fcbc881ff30,
qualname=0x7fcbc881ff30) at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4329
#21 0x00005602e485b559 in _PyFunction_Vectorcall (func=<optimized out>, stack=<optimized out>,
nargsf=<optimized out>, kwnames=<optimized out>) at /usr/local/src/conda/python-3.9.19/Objects/call.c:396
#22 0x00005602e484b352 in _PyObject_VectorcallTstate (kwnames=0x0, nargsf=<optimized out>, args=0x5602e81f9350,
callable=0x7fcbc888fb80, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:118
#23 PyObject_Vectorcall (kwnames=0x0, nargsf=<optimized out>, args=0x5602e81f9350, callable=0x7fcbc888fb80)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:127
#24 call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:5077
#25 _PyEval_EvalFrameDefault (tstate=<optimized out>, f=0x5602e81f90c0, throwflag=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:3520
#26 0x00005602e484a184 in _PyEval_EvalFrame (throwflag=0, f=0x5602e81f90c0, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/internal/pycore_ceval.h:40
#27 _PyEval_EvalCode (tstate=0x5602e4acc8b0, _co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=0x7fcbc5e32098,
kwargs=0x7fcbd9fab418, kwcount=2, kwstep=1, defs=0x0, defcount=<optimized out>, kwdefs=0x7fcbc8829300,
closure=0x0, name=0x7fcbf7019580, qualname=0x7fcbf7019580)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4329
#28 0x00005602e485b559 in _PyFunction_Vectorcall (func=<optimized out>, stack=<optimized out>,
nargsf=<optimized out>, kwnames=<optimized out>) at /usr/local/src/conda/python-3.9.19/Objects/call.c:396
#29 0x00005602e486917c in PyVectorcall_Call (kwargs=<optimized out>, tuple=<optimized out>,
callable=0x7fcbc88244c0) at /usr/local/src/conda/python-3.9.19/Objects/call.c:243
#30 _PyObject_Call (kwargs=<optimized out>, args=<optimized out>, callable=0x7fcbc88244c0,
tstate=<optimized out>) at /usr/local/src/conda/python-3.9.19/Objects/call.c:266
#31 PyObject_Call (callable=0x7fcbc88244c0, args=<optimized out>, kwargs=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Objects/call.c:293
#32 0x00005602e484f516 in do_call_core (kwdict=0x7fcbc5e35180, callargs=0x7fcbc5e7c180, func=0x7fcbc88244c0,
tstate=<optimized out>) at /usr/local/src/conda/python-3.9.19/Python/ceval.c:5125
#33 _PyEval_EvalFrameDefault (tstate=<optimized out>, f=0x5602f64ed350, throwflag=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:3582
#34 0x00005602e484a184 in _PyEval_EvalFrame (throwflag=0, f=0x5602f64ed350, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/internal/pycore_ceval.h:40
#35 _PyEval_EvalCode (tstate=0x5602e4acc8b0, _co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=0x7fcbf6d6edd8,
kwargs=0x5602e4b2ebe0, kwcount=2, kwstep=1, defs=0x7fcbf6d68658, defcount=<optimized out>, kwdefs=0x0,
closure=0x0, name=0x7fcbf6d568f0, qualname=0x7fcbf6d568f0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4329
#36 0x00005602e485b559 in _PyFunction_Vectorcall (func=<optimized out>, stack=<optimized out>,
nargsf=<optimized out>, kwnames=<optimized out>) at /usr/local/src/conda/python-3.9.19/Objects/call.c:396
#37 0x00005602e484c162 in _PyObject_VectorcallTstate (kwnames=0x7fcbf6d6edc0, nargsf=<optimized out>,
args=<optimized out>, callable=0x7fcbc5e7e820, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:118
#38 PyObject_Vectorcall (kwnames=0x7fcbf6d6edc0, nargsf=<optimized out>, args=<optimized out>,
callable=0x7fcbc5e7e820) at /usr/local/src/conda/python-3.9.19/Include/cpython/abstract.h:127
#39 call_function (kwnames=0x7fcbf6d6edc0, oparg=<optimized out>, pp_stack=<synthetic pointer>,
tstate=<optimized out>) at /usr/local/src/conda/python-3.9.19/Python/ceval.c:5077
#40 _PyEval_EvalFrameDefault (tstate=<optimized out>, f=0x5602e4b2ea50, throwflag=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:3537
#41 0x00005602e484a184 in _PyEval_EvalFrame (throwflag=0, f=0x5602e4b2ea50, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/internal/pycore_ceval.h:40
#42 _PyEval_EvalCode (tstate=0x5602e4acc8b0, _co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=0x0, kwargs=0x0, kwcount=0,
kwstep=2, defs=0x0, defcount=<optimized out>, kwdefs=0x0, closure=0x0, name=0x0, qualname=0x0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4329
#43 0x00005602e4849e58 in _PyEval_EvalCodeWithName (_co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=<optimized out>, kwargs=0x0,
kwcount=0, kwstep=2, defs=0x0, defcount=0, kwdefs=0x0, closure=0x0, name=0x0, qualname=0x0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4361
#41 0x00005602e484a184 in _PyEval_EvalFrame (throwflag=0, f=0x5602e4b2ea50, tstate=0x5602e4acc8b0)
at /usr/local/src/conda/python-3.9.19/Include/internal/pycore_ceval.h:40
#42 _PyEval_EvalCode (tstate=0x5602e4acc8b0, _co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=0x0, kwargs=0x0, kwcount=0,
kwstep=2, defs=0x0, defcount=<optimized out>, kwdefs=0x0, closure=0x0, name=0x0, qualname=0x0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4329
#43 0x00005602e4849e58 in _PyEval_EvalCodeWithName (_co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kwnames=<optimized out>, kwargs=0x0,
kwcount=0, kwstep=2, defs=0x0, defcount=0, kwdefs=0x0, closure=0x0, name=0x0, qualname=0x0)
at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4361
--Type <RET> for more, q to quit, c to continue without paging--
#44 0x00005602e4849e09 in PyEval_EvalCodeEx (_co=<optimized out>, globals=<optimized out>,
locals=<optimized out>, args=<optimized out>, argcount=<optimized out>, kws=<optimized out>, kwcount=0,
defs=0x0, defcount=0, kwdefs=0x0, closure=0x0) at /usr/local/src/conda/python-3.9.19/Python/ceval.c:4377
#45 0x00005602e48f74ab in PyEval_EvalCode (co=co@entry=0x7fcbf6d69710, globals=globals@entry=0x7fcbf70e3ac0,
locals=locals@entry=0x7fcbf70e3ac0) at /usr/local/src/conda/python-3.9.19/Python/ceval.c:828
#46 0x00005602e492487a in run_eval_code_obj (tstate=0x5602e4acc8b0, co=0x7fcbf6d69710, globals=0x7fcbf70e3ac0,
locals=0x7fcbf70e3ac0) at /usr/local/src/conda/python-3.9.19/Python/pythonrun.c:1221
#47 0x00005602e4920c03 in run_mod (mod=<optimized out>, filename=<optimized out>, globals=0x7fcbf70e3ac0,
locals=0x7fcbf70e3ac0, flags=<optimized out>, arena=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Python/pythonrun.c:1242
#48 0x00005602e47b4175 in pyrun_file (fp=0x5602e4b51b80, filename=0x7fcbf7026810, start=<optimized out>,
globals=0x7fcbf70e3ac0, locals=0x7fcbf70e3ac0, closeit=1, flags=0x7fffc6dbe7f8)
at /usr/local/src/conda/python-3.9.19/Python/pythonrun.c:1140
#49 0x00005602e491a841 in pyrun_simple_file (flags=0x7fffc6dbe7f8, closeit=1, filename=0x7fcbf7026810,
fp=0x5602e4b51b80) at /usr/local/src/conda/python-3.9.19/Python/pythonrun.c:450
#50 PyRun_SimpleFileExFlags (fp=0x5602e4b51b80, filename=<optimized out>, closeit=1, flags=0x7fffc6dbe7f8)
at /usr/local/src/conda/python-3.9.19/Python/pythonrun.c:483
#51 0x00005602e4917c6d in pymain_run_file (cf=0x7fffc6dbe7f8, config=0x5602e4acd190)
at /usr/local/src/conda/python-3.9.19/Modules/main.c:377
#52 pymain_run_python (exitcode=0x7fffc6dbe7f0) at /usr/local/src/conda/python-3.9.19/Modules/main.c:602
#53 Py_RunMain () at /usr/local/src/conda/python-3.9.19/Modules/main.c:681
#54 0x00005602e48eb2e7 in Py_BytesMain (argc=<optimized out>, argv=<optimized out>)
at /usr/local/src/conda/python-3.9.19/Modules/main.c:1101
#55 0x00007fcbf723f24d in __libc_start_main () from /lib64/libc.so.6
#56 0x00005602e48eb1e1 in _start () |
Beta Was this translation helpful? Give feedback.
I assume that nvidia 22.2 refers to the 22.2 SDK, which contains the entire toolkit but only for CUDA 11. Perhaps that module is somehow interfering with the CUDA 12.5 that you got from the conda installation of cuquantum-python. In any case, I'm glad that it's resolved.