Hi All,
I'm running into a weird bug. On torch 1.5.1, training my network on CPU works perfectly fine. However, after upgrading to torch 1.6.0, CPU training fails. Below is the gdb
stack trace:
free(): invalid next size (normal)
Thread 1 "python" received signal SIGABRT, Aborted.
__GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:51
51 ../sysdeps/unix/sysv/linux/raise.c: No such file or directory.
(gdb) bt
#0 __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:51
#1 0x00007ffff7805801 in __GI_abort () at abort.c:79
#2 0x00007ffff784e897 in __libc_message (action=action@entry=do_abort, fmt=fmt@entry=0x7ffff797bb9a "%s\n") at ../sysdeps/posix/libc_fatal.c:181
#3 0x00007ffff785590a in malloc_printerr (str=str@entry=0x7ffff797d8b8 "free(): invalid next size (normal)") at malloc.c:5350
#4 0x00007ffff785d0ad in _int_free (have_lock=0, p=0x555586de8db0, av=0x7ffff7bb0c40 <main_arena>) at malloc.c:4286
#5 __GI___libc_free (mem=0x555586de8dc0) at malloc.c:3124
#6 0x00007fff33ac9203 in _ZNSt17_Function_handlerIFvPvEUlS0_E0_E9_M_invokeERKSt9_Any_dataOS0_ () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#7 0x00007fff33ab7333 in std::_Sp_counted_deleter<void*, std::function<void (void*)>, std::allocator<void>, (__gnu_cxx::_Lock_policy)2>::_M_dispose() ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#8 0x00007fff33ad18da in at::native::IntrusivePtrTargetWrapper<ideep::tensor>::~IntrusivePtrTargetWrapper() () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#9 0x00007fff3347a1b9 in c10::intrusive_ptr<c10::TensorImpl, c10::UndefinedTensorImpl>::reset_() () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#10 0x00007fff33abfd6b in at::native::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#11 0x00007fff33cc263e in at::TypeDefault::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#12 0x00007fff33cf0266 in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor> (*)(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool), std::tuple<at::Tensor, at::Tensor>, c10::guts::typelist::typelist<c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool> >, std::tuple<at::Tensor, at::Tensor> (c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool)>::call(c10::OperatorKernel*, c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#13 0x00007fff33c2aeaf in at::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool)
() from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#14 0x00007fff33abf8fb in at::native::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#15 0x00007fff33cc271a in at::TypeDefault::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#16 0x00007fff33cf02bc in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor, at::Tensor> (*)(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>), std::tuple<at::Tensor, at::Tensor, at::Tensor>, c10::guts::typelist::typelist<at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul> > >, std::tuple<at::Tensor, at::Tensor, at::Tensor> (at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>)>::call(c10::OperatorKernel*, at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#17 0x00007fff33c2e4bb in at::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#18 0x00007fff3587c632 in torch::autograd::VariableType::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#19 0x00007fff33cf02bc in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor, at::Tensor> (*)(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>), std::tuple<at::Tensor, at::Tensor, at::Tensor>, c10::guts::typelist::typelist<at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul> > >, std::tuple<at::Tensor, at::Tensor, at::Tensor> (at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>)>::call(c10::OperatorKernel*, at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#20 0x00007fff33c2e4bb in at::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
---Type <return> to continue, or q <return> to quit---
#21 0x00007fff35782f93 in torch::autograd::generated::MkldnnConvolutionBackward::apply(std::vector<at::Tensor, std::allocator<at::Tensor> >&&) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#22 0x00007fff35da1017 in torch::autograd::Node::operator()(std::vector<at::Tensor, std::allocator<at::Tensor> >&&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#23 0x00007fff35d9c860 in torch::autograd::Engine::evaluate_function(std::shared_ptr<torch::autograd::GraphTask>&, torch::autograd::Node*, torch::autograd::InputBuffer&, std::shared_ptr<torch::autograd::ReadyQueue> const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#24 0x00007fff35d9d401 in torch::autograd::Engine::thread_main(std::shared_ptr<torch::autograd::GraphTask> const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#25 0x00007fff35d9ab1c in torch::autograd::Engine::execute_with_graph_task(std::shared_ptr<torch::autograd::GraphTask> const&, std::shared_ptr<torch::autograd::Node>) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#26 0x00007fff39cbadcc in torch::autograd::python::PythonEngine::execute_with_graph_task(std::shared_ptr<torch::autograd::GraphTask> const&, std::shared_ptr<torch::autograd::Node>) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#27 0x00007fff35d99e53 in torch::autograd::Engine::execute(std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&, std::vector<at::Tensor, std::allocator<at::Tensor> > const&, bool, bool, std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#28 0x00007fff39cbabbe in torch::autograd::python::PythonEngine::execute(std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&, std::vector<at::Tensor, std::allocator<at::Tensor> > const&, bool, bool, std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#29 0x00007fff39cbb889 in THPEngine_run_backward(THPEngine*, _object*, _object*) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#30 0x00005555556b87e6 in _PyMethodDef_RawFastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:694
#31 0x00005555556b8861 in _PyCFunction_FastCallKeywords (func=0x7ffe2c19b2d0, args=<optimized out>, nargs=<optimized out>, kwnames=<optimized out>)
at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:734
#32 0x00005555557247cc in call_function (kwnames=0x7fffedb0ead0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4568
#33 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3139
#34 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#35 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#36 0x0000555555723f29 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#37 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3093
#38 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#39 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#40 0x000055555571fa93 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#41 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3110
#42 0x00005555556b7ccb in function_code_fastcall (globals=<optimized out>, nargs=1, args=<optimized out>, co=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:283
#43 _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:408
#44 0x000055555571fa93 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#45 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3110
#46 0x00005555556b7ccb in function_code_fastcall (globals=<optimized out>, nargs=3, args=<optimized out>, co=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:283
#47 _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:408
#48 0x000055555571f806 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#49 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3124
#50 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#51 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#52 0x000055555571f806 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#53 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3124
#54 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#55 0x0000555555669424 in PyEval_EvalCodeEx () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3959
---Type <return> to continue, or q <return> to quit---
#56 0x000055555566944c in PyEval_EvalCode (co=<optimized out>, globals=<optimized out>, locals=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:524
#57 0x000055555577eb74 in run_mod () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:1035
#58 0x0000555555788eb1 in PyRun_FileExFlags () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:988
#59 0x00005555557890a3 in PyRun_SimpleFileExFlags () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:429
#60 0x000055555578a195 in pymain_run_file (p_cf=0x7fffffffe110, filename=0x5555558c0900 L"train.py", fp=0x5555559090e0) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:433
#61 pymain_run_filename (cf=0x7fffffffe110, pymain=0x7fffffffe220) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:1612
#62 pymain_run_python (pymain=0x7fffffffe220) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:2873
#63 pymain_main () at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:3413
#64 0x000055555578a2bc in _Py_UnixMain () at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:3448
#65 0x00007ffff77e6b97 in __libc_start_main (main=0x5555556496c0 <main>, argc=6, argv=0x7fffffffe378, init=<optimized out>, fini=<optimized out>, rtld_fini=<optimized out>, stack_end=0x7fffffffe368)
at ../csu/libc-start.c:310
#66 0x000055555572f062 in _start () at ../sysdeps/x86_64/elf/start.S:103
Running my training script in another gdb session yields a "corrupted double-linked list"
error instead, though the stack trace points to the same spot (at::native::mkldnn_convolution_backward_weights):
corrupted double-linked list
Thread 1 "python" received signal SIGABRT, Aborted.
__GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:51
51 ../sysdeps/unix/sysv/linux/raise.c: No such file or directory.
(gdb) bt
#0 __GI_raise (sig=sig@entry=6) at ../sysdeps/unix/sysv/linux/raise.c:51
#1 0x00007ffff7805801 in __GI_abort () at abort.c:79
#2 0x00007ffff784e897 in __libc_message (action=action@entry=do_abort, fmt=fmt@entry=0x7ffff797bb9a "%s\n") at ../sysdeps/posix/libc_fatal.c:181
#3 0x00007ffff785590a in malloc_printerr (str=str@entry=0x7ffff7979cba "corrupted double-linked list") at malloc.c:5350
#4 0x00007ffff7855ac4 in malloc_consolidate (av=av@entry=0x7ffff7bb0c40 <main_arena>) at malloc.c:4456
#5 0x00007ffff785d03b in _int_free (have_lock=0, p=<optimized out>, av=0x7ffff7bb0c40 <main_arena>) at malloc.c:4362
#6 __GI___libc_free (mem=0x5555c0ecf480) at malloc.c:3124
#7 0x00007fff33ac9203 in _ZNSt17_Function_handlerIFvPvEUlS0_E0_E9_M_invokeERKSt9_Any_dataOS0_ () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#8 0x00007fff33ab7333 in std::_Sp_counted_deleter<void*, std::function<void (void*)>, std::allocator<void>, (__gnu_cxx::_Lock_policy)2>::_M_dispose() ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#9 0x00007fff33ab81fa in ideep::tensor::~tensor() () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#10 0x00007fff33ac4045 in void ideep::convolution_backward_weights::compute_impl<true>(ideep::tensor const&, ideep::tensor const&, std::vector<long, std::allocator<long> > const&, ideep::tensor&, ideep::tensor&, std::vector<long, std::allocator<long> > const&, std::vector<long, std::allocator<long> > const&, std::vector<long, std::allocator<long> > const&, std::vector<long, std::allocator<long> > const&, int, dnnl::memory::data_type, dnnl::algorithm, ideep::engine const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#11 0x00007fff33abfc6f in at::native::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#12 0x00007fff33cc263e in at::TypeDefault::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#13 0x00007fff33cf0266 in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor> (*)(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool), std::tuple<at::Tensor, at::Tensor>, c10::guts::typelist::typelist<c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool> >, std::tuple<at::Tensor, at::Tensor> (c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool)>::call(c10::OperatorKernel*, c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#14 0x00007fff33c2aeaf in at::mkldnn_convolution_backward_weights(c10::ArrayRef<long>, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, bool)
() from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#15 0x00007fff33abf8fb in at::native::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#16 0x00007fff33cc271a in at::TypeDefault::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#17 0x00007fff33cf02bc in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor, at::Tensor> (*)(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>), std::tuple<at::Tensor, at::Tensor, at::Tensor>, c10::guts::typelist::typelist<at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul> > >, std::tuple<at::Tensor, at::Tensor, at::Tensor> (at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>)>::call(c10::OperatorKernel*, at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#18 0x00007fff33c2e4bb in at::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#19 0x00007fff3587c632 in torch::autograd::VariableType::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#20 0x00007fff33cf02bc in c10::impl::wrap_kernel_functor_unboxed_<c10::impl::detail::WrapFunctionIntoRuntimeFunctor_<std::tuple<at::Tensor, at::Tensor, at::Tensor> (*)(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>), std::tuple<at::Tensor, at::Tensor, at::Tensor>, c10::guts::typelist::typelist<at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul> > >, std::tuple<at::Tensor, at::Tensor, at::Tensor> (at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>)>::call(c10::OperatorKernel*, at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
---Type <return> to continue, or q <return> to quit---
#21 0x00007fff33c2e4bb in at::mkldnn_convolution_backward(at::Tensor const&, at::Tensor const&, at::Tensor const&, c10::ArrayRef<long>, c10::ArrayRef<long>, c10::ArrayRef<long>, long, std::array<bool, 3ul>) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#22 0x00007fff35782f93 in torch::autograd::generated::MkldnnConvolutionBackward::apply(std::vector<at::Tensor, std::allocator<at::Tensor> >&&) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#23 0x00007fff35da1017 in torch::autograd::Node::operator()(std::vector<at::Tensor, std::allocator<at::Tensor> >&&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#24 0x00007fff35d9c860 in torch::autograd::Engine::evaluate_function(std::shared_ptr<torch::autograd::GraphTask>&, torch::autograd::Node*, torch::autograd::InputBuffer&, std::shared_ptr<torch::autograd::ReadyQueue> const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#25 0x00007fff35d9d401 in torch::autograd::Engine::thread_main(std::shared_ptr<torch::autograd::GraphTask> const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#26 0x00007fff35d9ab1c in torch::autograd::Engine::execute_with_graph_task(std::shared_ptr<torch::autograd::GraphTask> const&, std::shared_ptr<torch::autograd::Node>) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#27 0x00007fff39cbadcc in torch::autograd::python::PythonEngine::execute_with_graph_task(std::shared_ptr<torch::autograd::GraphTask> const&, std::shared_ptr<torch::autograd::Node>) ()
from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#28 0x00007fff35d99e53 in torch::autograd::Engine::execute(std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&, std::vector<at::Tensor, std::allocator<at::Tensor> > const&, bool, bool, std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_cpu.so
#29 0x00007fff39cbabbe in torch::autograd::python::PythonEngine::execute(std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&, std::vector<at::Tensor, std::allocator<at::Tensor> > const&, bool, bool, std::vector<torch::autograd::Edge, std::allocator<torch::autograd::Edge> > const&) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#30 0x00007fff39cbb889 in THPEngine_run_backward(THPEngine*, _object*, _object*) () from /home/kevin/anaconda3/lib/python3.7/site-packages/torch/lib/libtorch_python.so
#31 0x00005555556b87e6 in _PyMethodDef_RawFastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:694
#32 0x00005555556b8861 in _PyCFunction_FastCallKeywords (func=0x7ffe2c1827d0, args=<optimized out>, nargs=<optimized out>, kwnames=<optimized out>)
at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:734
#33 0x00005555557247cc in call_function (kwnames=0x7fffeb61cbd0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4568
#34 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3139
#35 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#36 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#37 0x0000555555723f29 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#38 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3093
#39 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#40 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#41 0x000055555571fa93 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#42 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3110
#43 0x00005555556b7ccb in function_code_fastcall (globals=<optimized out>, nargs=1, args=<optimized out>, co=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:283
#44 _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:408
#45 0x000055555571fa93 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#46 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3110
#47 0x00005555556b7ccb in function_code_fastcall (globals=<optimized out>, nargs=3, args=<optimized out>, co=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:283
#48 _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:408
#49 0x000055555571f806 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
#50 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3124
#51 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#52 0x00005555556b7ef5 in _PyFunction_FastCallKeywords () at /tmp/build/80754af9/python_1565725737370/work/Objects/call.c:433
#53 0x000055555571f806 in call_function (kwnames=0x0, oparg=<optimized out>, pp_stack=<synthetic pointer>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:4616
---Type <return> to continue, or q <return> to quit---
#54 _PyEval_EvalFrameDefault () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3124
#55 0x0000555555668539 in _PyEval_EvalCodeWithName () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3930
#56 0x0000555555669424 in PyEval_EvalCodeEx () at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:3959
#57 0x000055555566944c in PyEval_EvalCode (co=<optimized out>, globals=<optimized out>, locals=<optimized out>) at /tmp/build/80754af9/python_1565725737370/work/Python/ceval.c:524
#58 0x000055555577eb74 in run_mod () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:1035
#59 0x0000555555788eb1 in PyRun_FileExFlags () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:988
#60 0x00005555557890a3 in PyRun_SimpleFileExFlags () at /tmp/build/80754af9/python_1565725737370/work/Python/pythonrun.c:429
#61 0x000055555578a195 in pymain_run_file (p_cf=0x7fffffffe110, filename=0x5555558c0900 L"train.py", fp=0x5555559090e0) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:433
#62 pymain_run_filename (cf=0x7fffffffe110, pymain=0x7fffffffe220) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:1612
#63 pymain_run_python (pymain=0x7fffffffe220) at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:2873
#64 pymain_main () at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:3413
#65 0x000055555578a2bc in _Py_UnixMain () at /tmp/build/80754af9/python_1565725737370/work/Modules/main.c:3448
#66 0x00007ffff77e6b97 in __libc_start_main (main=0x5555556496c0 <main>, argc=6, argv=0x7fffffffe378, init=<optimized out>, fini=<optimized out>, rtld_fini=<optimized out>, stack_end=0x7fffffffe368)
at ../csu/libc-start.c:310
#67 0x000055555572f062 in _start () at ../sysdeps/x86_64/elf/start.S:103
Let me know if there is any other information I can provide that would be helpful, thanks!