How can I avoid this error? It appears to be related to the type of the tensor. Does it mean the tensor is float64 instead of float32?
Below is the stack trace.
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/runpy.py”, line 194, in _run_module_as_main
return _run_code(code, main_globals, None,
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/runpy.py”, line 87, in _run_code
exec(code, run_globals)
File "/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/adapter/../../debugpy/launcher/../../debugpy/__main__.py", line 39, in <module>
cli.main()
File "/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/adapter/../../debugpy/launcher/../../debugpy/../debugpy/server/cli.py", line 430, in main
run()
File "/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/adapter/../../debugpy/launcher/../../debugpy/../debugpy/server/cli.py", line 284, in run_file
runpy.run_path(target, run_name="__main__")
File “/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/_vendored/pydevd/_pydevd_bundle/pydevd_runpy.py”, line 321, in run_path
return _run_module_code(code, init_globals, run_name,
File “/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/_vendored/pydevd/_pydevd_bundle/pydevd_runpy.py”, line 135, in _run_module_code
_run_code(code, mod_globals, init_globals,
File “/home/csgrad/mbhosale/.vscode-server/extensions/ms-python.python-2023.4.1/pythonFiles/lib/python/debugpy/_vendored/pydevd/_pydevd_bundle/pydevd_runpy.py”, line 124, in _run_code
exec(code, run_globals)
File "/home/csgrad/mbhosale/Image_registration/registration_copy/registration/mainvm.py", line 250, in <module>
mp.spawn(run_parallel,
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/multiprocessing/spawn.py”, line 240, in spawn
return start_processes(fn, args, nprocs, join, daemon, start_method='spawn')
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/multiprocessing/spawn.py”, line 198, in start_processes
while not context.join():
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/multiprocessing/spawn.py”, line 160, in join
raise ProcessRaisedException(msg, error_index, failed_process.pid)
torch.multiprocessing.spawn.ProcessRaisedException:

-- Process 1 terminated with the following error:
Traceback (most recent call last):
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/multiprocessing/spawn.py”, line 69, in _wrap
fn(i, *args)
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/mainvm.py”, line 132, in run_parallel
train.run()
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/train.py”, line 210, in run
self.train_epoch(optimizer, scheduler, epoch)
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/train.py”, line 107, in train_epoch
loss, trdice = self.trainIter(fixed, moving, fixed_label, moving_label, fixed_nopad=fixed_nopad)
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/train.py”, line 34, in trainIter
sim_loss, grad_loss, seg_loss, dice = self.model.forward(fix, moving,
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/parallel/distributed.py”, line 1008, in forward
output = self._run_ddp_forward(*inputs, **kwargs)
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/parallel/distributed.py”, line 969, in _run_ddp_forward
return module_to_run(*inputs[0], **kwargs[0])
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/modules/module.py”, line 1130, in _call_impl
return forward_call(*input, **kwargs)
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/models.py”, line 191, in forward
unet_out = self.unet(x)
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/modules/module.py”, line 1130, in _call_impl
return forward_call(*input, **kwargs)
File “/home/csgrad/mbhosale/Image_registration/registration_copy/registration/models.py”, line 149, in forward
y = self.upsample(y)
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/modules/module.py”, line 1130, in _call_impl
return forward_call(*input, **kwargs)
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/modules/upsampling.py”, line 153, in forward
return F.interpolate(input, self.size, self.scale_factor, self.mode, self.align_corners,
File “/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/site-packages/torch/nn/functional.py”, line 3912, in interpolate
return torch._C._nn.upsample_nearest3d(input, output_size, scale_factors)
RuntimeError: Expected output.numel() <= std::numeric_limits<int32_t>::max() to be true, but got false. (Could this error message be improved? If so, please report an enhancement request to PyTorch.)
/home/csgrad/mbhosale/anaconda3/envs/registration/lib/python3.8/multiprocessing/resource_tracker.py:216: UserWarning: resource_tracker: There appear to be 26 leaked semaphore objects to clean up at shutdown
warnings.warn('resource_tracker: There appear to be %d '