One of the variables needed for gradient computation has been modified by an inplace operation

drdlfy · January 20, 2018, 2:09pm

RuntimeError: one of the variables needed for gradient computation has been modified by an inplace operation

This error occurs when running, do not know how else, thank you for your help.

jpeg729 · January 20, 2018, 3:52pm

The solution (obviously) is to replace the inplace operation with an op that doesn’t modify the data in place.

More than that I can’t say without seeing any code.

drdlfy · January 21, 2018, 4:50am

I code a little more, it can not be located where the error, so I can not get you to see the code, but still, thank you very much

drdlfy · January 21, 2018, 6:08am

import torch.nn as nn
import torchvision.models as models
from torch.nn import functional as F

class ResidualConvUnit(nn.Module):

def __init__(self, features):
    super(ResidualConvUnit,self).__init__()

    self.conv1 = nn.Conv2d(
        features, features, kernel_size=3, stride=1, padding=1, bias=True)
    self.conv2 = nn.Conv2d(
        features, features, kernel_size=3, stride=1, padding=1, bias=False)
    self.relu = nn.ReLU(inplace=True)

def forward(self, x):

    out = self.relu(x)
    out = self.conv1(out)
    out = self.relu(out)
    out = self.conv2(out)

    return out + x

class MultiResolutionFusion(nn.Module):

def __init__(self, out_feats, *shapes):
    super(MultiResolutionFusion,self).__init__()

    _, max_size = max(shapes, key=lambda x: x[1])

    for i, shape in enumerate(shapes):
        feat, size = shape
        if max_size % size != 0:
            raise ValueError("max_size not divisble by shape {}".format(i))

        scale_factor = max_size // size
        if scale_factor != 1:
            self.add_module("resolve{}".format(i), nn.Sequential(
                nn.Conv2d(feat, out_feats, kernel_size=3,
                          stride=1, padding=1, bias=False),
                nn.Upsample(scale_factor=scale_factor, mode='bilinear')
            ))
        else:
            self.add_module(
                "resolve{}".format(i),
                nn.Conv2d(feat, out_feats, kernel_size=3,
                          stride=1, padding=1, bias=False)
            )

def forward(self, *xs):

    output = self.resolve0(xs[0])

    for i, x in enumerate(xs[1:], 1):
        output = output + self.__getattr__("resolve{}".format(i))(x)

    return output

class ChainedResidualPool(nn.Module):

def __init__(self, feats):
    super(ChainedResidualPool,self).__init__()

    self.relu = nn.ReLU(inplace=True)
    for i in range(1, 4):
        self.add_module("block{}".format(i), nn.Sequential(
            nn.MaxPool2d(kernel_size=5, stride=1, padding=2),
            nn.Conv2d(feats, feats, kernel_size=3, stride=1, padding=1, bias=False)
        ))

def forward(self, x):
    x = self.relu(x)
    path = x

    for i in range(1, 4):
        path = self.__getattr__("block{}".format(i))(path)
        x = x + path

    return x

class ChainedResidualPoolImproved(nn.Module):

def __init__(self, feats):
    super(ChainedResidualPoolImproved,self).__init__()

    self.relu = nn.ReLU(inplace=True)
    for i in range(1, 5):
        self.add_module("block{}".format(i), nn.Sequential(
            nn.Conv2d(feats, feats, kernel_size=3, stride=1, padding=1, bias=False),
            nn.MaxPool2d(kernel_size=5, stride=1, padding=2)
        ))

def forward(self, x):
    x = self.relu(x)
    path = x

    for i in range(1, 5):
        path = self.__getattr__("block{}".format(i))(path)
        x = x + path

    return x

class BaseRefineNetBlock(nn.Module):

def __init__(self, features,
             residual_conv_unit,
             multi_resolution_fusion,
             chained_residual_pool, *shapes):
    super(BaseRefineNetBlock,self).__init__()
    print shapes
    for i, shape in enumerate(shapes):
        feats = shape[0]
        self.add_module("rcu{}".format(i), nn.Sequential(
            residual_conv_unit(feats),
            residual_conv_unit(feats)
        ))

    if len(shapes) != 1:
        self.mrf = multi_resolution_fusion(features, *shapes)
    else:
        self.mrf = None

    self.crp = chained_residual_pool(features)
    self.output_conv = residual_conv_unit(features)

def forward(self, *xs):
    for i, x in enumerate(xs):
        x = self.__getattr__("rcu{}".format(i))(x)

    if self.mrf is not None:
        out = self.mrf(*xs)
    else:
        out = xs[0]

    out = self.crp(out)
    return self.output_conv(out)

class RefineNetBlock(BaseRefineNetBlock):

def __init__(self, features, *shapes):
    super(RefineNetBlock,self).__init__(features, ResidualConvUnit,
                     MultiResolutionFusion,
                     ChainedResidualPool, *shapes)

class BaseRefineNet4Cascade(nn.Module):

def __init__(self, input_shape,
             refinenet_block,
             num_classes=2,
             features=256,
             resnet_factory=models.resnet101,
             pretrained=True,
             freeze_resnet=False):
    """Multi-path 4-Cascaded RefineNet for image segmentation

    Args:
        input_shape ((int, int)): (channel, size) assumes input has
            equal height and width
        refinenet_block (block): RefineNet Block
        num_classes (int, optional): number of classes
        features (int, optional): number of features in refinenet
        resnet_factory (func, optional): A Resnet model from torchvision.
            Default: models.resnet101
        pretrained (bool, optional): Use pretrained version of resnet
            Default: True
        freeze_resnet (bool, optional): Freeze resnet model
            Default: True

    Raises:
        ValueError: size of input_shape not divisible by 32
    """
    super(BaseRefineNet4Cascade,self).__init__()

    input_channel, input_size = input_shape

    if input_size % 32 != 0:
        raise ValueError("{} not divisble by 32".format(input_shape))

    resnet = resnet_factory(pretrained=pretrained)

    self.layer1 = nn.Sequential(
        resnet.conv1,
        resnet.bn1,
        resnet.relu,
        resnet.maxpool,
        resnet.layer1
    )

    self.layer2 = resnet.layer2
    self.layer3 = resnet.layer3
    self.layer4 = resnet.layer4


    self.layer1_rn = nn.Conv2d(
        256, features, kernel_size=3, stride=1, padding=1, bias=False)
    self.layer2_rn = nn.Conv2d(
        512, features, kernel_size=3, stride=1, padding=1, bias=False)
    self.layer3_rn = nn.Conv2d(
        1024, features, kernel_size=3, stride=1, padding=1, bias=False)
    self.layer4_rn = nn.Conv2d(
        2048, 2 * features, kernel_size=3, stride=1, padding=1, bias=False)

    self.refinenet4 = RefineNetBlock(
        2 * features, (2 * features, input_size // 32))
    self.refinenet3 = RefineNetBlock(
        features, (2 * features, input_size // 32), (features, input_size // 16))
    self.refinenet2 = RefineNetBlock(
        features, (features, input_size // 16), (features, input_size // 8))
    self.refinenet1 = RefineNetBlock(
        features, (features, input_size // 8), (features, input_size // 4))

    self.output_conv = nn.Sequential(
        ResidualConvUnit(features),
        ResidualConvUnit(features),
        nn.Conv2d(features, num_classes, kernel_size=1, stride=1, padding=0, bias=True)
    )

def forward(self, x):

    layer_1 = self.layer1(x)
    layer_2 = self.layer2(layer_1)
    layer_3 = self.layer3(layer_2)
    layer_4 = self.layer4(layer_3)

    layer_1_rn = self.layer1_rn(layer_1)
    layer_2_rn = self.layer2_rn(layer_2)
    layer_3_rn = self.layer3_rn(layer_3)
    layer_4_rn = self.layer4_rn(layer_4)

    path_4 = self.refinenet4(layer_4_rn)
    path_3 = self.refinenet3(path_4, layer_3_rn)
    path_2 = self.refinenet2(path_3, layer_2_rn)
    path_1 = self.refinenet1(path_2, layer_1_rn)
    out = self.output_conv(path_1)
    return out

class RefineNet4Cascade(BaseRefineNet4Cascade):

def __init__(self, input_shape,
             num_classes=2,
             features=256,
             resnet_factory=models.resnet101,
             pretrained=True,
             freeze_resnet=False):
    """Multi-path 4-Cascaded RefineNet for image segmentation

    Args:
        input_shape ((int, int)): (channel, size) assumes input has
            equal height and width
        refinenet_block (block): RefineNet Block
        num_classes (int, optional): number of classes
        features (int, optional): number of features in refinenet
        resnet_factory (func, optional): A Resnet model from torchvision.
            Default: models.resnet101
        pretrained (bool, optional): Use pretrained version of resnet
            Default: True
        freeze_resnet (bool, optional): Freeze resnet model
            Default: True

    Raises:
        ValueError: size of input_shape not divisible by 32
    """
    super(RefineNet4Cascade,self).__init__(input_shape, RefineNetBlock,
                     num_classes=num_classes, features=features,
                     resnet_factory=resnet_factory, pretrained=pretrained,
                     freeze_resnet=freeze_resnet)

drdlfy · January 21, 2018, 6:10am

Hello, a bit more code, an image segmentation model, so you can see where the problem appears? Thank you very much

jpeg729 · January 21, 2018, 12:13pm

I should have asked for a stack trace as well. Nevertheless I will hasard a guess.

Have you tried replacing nn.ReLU(inplace=True) with nn.ReLU()?

Besides the line x = self.relu(x) is confused because it does two things.

it applies relu to x inplace thus modifying the input data
it then reassigns x to x which is pointless given that x has already been modified inplace.

The line out = self.relu(x) is worse because it does not make it clear that x is modified inplace by the relu operation. Readability is important.

My guess is that trying to optimise by using inplace operations will easily lead to confusion, frustration and probably not a huge improvement in efficiency. So I would suggest getting the code to work without inplace operations, and only then try adding some.

drdlfy · January 22, 2018, 8:45am

Thank you very much, indeed the error caused by relu, now you can work normally, thank you very much, I study well nn.ReLU(inplace=True)

ginobilinie · February 6, 2018, 10:45pm

Hi, do you solve it? I encounter the same problem when I try to run the refinenet.

I have replaced the nn.ReLU(inplace=True) with nn.ReLU, but the same error is still there.

Do you make any other changes to make it go well?

drdlfy · February 7, 2018, 2:07am

I have solved this problem by replacing nn.ReLU (inplace = True) with nn.ReLU. It seems that no other changes

hasakii · November 16, 2018, 8:57am

It would be the problem with shortcut connection:

x += f(x)

keep in mind that += is inplace assign add.