Runtime error with embeddings

Hello,

I’m trying to get this model to run and I keep getting the following error:

BTW, I checked out this related thread, but it didn’t really help with my error (or I didn’t understand it): Expected tensor for argument #1 'indices' to have scalar type Long; but got CPUFloatTensor instead (while checking arguments for embedding)

---------------------------------------------------------------------------
RuntimeError                              Traceback (most recent call last)
<ipython-input-778-34aa93336f9e> in <module>
     94 
     95         # Forward pass
---> 96         outputs = tab_model(numerical_data, categorical_data, train_tensor)
     97         loss = criterion(outputs, label)
     98         print(f"tab epoch: {epoch}, tab loss: {loss}")

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\module.py in __call__(self, *input, **kwargs)
    530             result = self._slow_forward(*input, **kwargs)
    531         else:
--> 532             result = self.forward(*input, **kwargs)
    533         for hook in self._forward_hooks.values():
    534             hook_result = hook(self, input, result)

<ipython-input-775-fc3cf1d18657> in forward(self, x_categorical, x_numerical, predictions)
     35         embeddings = []
     36         for i, e in enumerate(self.all_embeddings):
---> 37             embeddings.append(e(x_categorical[:,i]).type(torch.LongTensor))
     38 
     39         cat_embedd = torch.cat(embeddings, 1)

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\module.py in __call__(self, *input, **kwargs)
    530             result = self._slow_forward(*input, **kwargs)
    531         else:
--> 532             result = self.forward(*input, **kwargs)
    533         for hook in self._forward_hooks.values():
    534             hook_result = hook(self, input, result)

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\sparse.py in forward(self, input)
    112         return F.embedding(
    113             input, self.weight, self.padding_idx, self.max_norm,
--> 114             self.norm_type, self.scale_grad_by_freq, self.sparse)
    115 
    116     def extra_repr(self):

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\functional.py in embedding(input, weight, padding_idx, max_norm, norm_type, scale_grad_by_freq, sparse)
   1482         # remove once script supports set_grad_enabled
   1483         _no_grad_embedding_renorm_(weight, input, max_norm, norm_type)
-> 1484     return torch.embedding(weight, input, padding_idx, scale_grad_by_freq, sparse)
   1485 
   1486 

RuntimeError: Expected tensor for argument #1 'indices' to have scalar type Long; but got torch.cuda.FloatTensor instead (while checking arguments for embedding)

Here is the model:

class Data_Only_Model(nn.Module):
    def __init__(self, embedding_size):
        super().__init__()

        # ModuleList holding an embedding layer for each categorical column
        self.all_embeddings = nn.ModuleList([nn.Embedding(ni, nf) for ni, nf in embedding_size])
        self.embedding_dropout = nn.Dropout(p = .04)
        
        self.fc1 = nn.Linear(78, 1000)
        self.fc2 = nn.BatchNorm1d(1000)
        self.fc3 = nn.Dropout(p = .04)
        self.fc4= nn.Linear(1000, 256)
        self.fc5= nn.BatchNorm1d(256)
        self.fc6= nn.Dropout(p = .04)  
        self.fc7= nn.Linear(256, 128)
        self.fc8= nn.BatchNorm1d(128)
        self.fc9= nn.Dropout(p = .04)                            
        self.fc10= nn.Linear(128, 32)
        self.fc11= nn.BatchNorm1d(32)
        self.fc12= nn.Dropout(p = .04)
        self.fc13= nn.Linear(32, 2)
  
    # define the forward method
    def forward(self, x_categorical, x_numerical, predictions):
        embeddings = []
        for i, e in enumerate(self.all_embeddings):
            embeddings.append(e(x_categorical[:,i]))
            
        cat_embedd = torch.cat(embeddings, 1)
        print("cat", x.size())

        numerical = x_numerical
        print("numerical", numerical.size())
        x = torch.cat((cat_embedd, x_numerical), dim = 1)
        print('1 concat', x.size())
        x4 = torch.cat((x, predictions), dim = 1)
        print('X4', x4.size())
              
        
        
        x4 = F.relu(self.fc1(x4))
        x4 = self.fc2(x4)
        x4 = self.fc3(x4)
        x4 = self.fc4(x4)
        x4 = self.fc5(x4)
        x4 = self.fc6(x4)
        x4 = F.relu(self.fc7(x4))
        x4 = self.fc8(x4)
        x4 = self.fc9(x4)
        x4 = F.relu(self.fc10(x4))
        x4 = self.fc11(x4)
        x4 = self.fc12(x4)
        x4 = self.fc13(x4)
        x4 = F.log_softmax(x4, dim=1)
        return x4

tab_model = Data_Only_Model(embedding_size=embeddings)
tab_model.to(device)

Data_Only_Model(
  (all_embeddings): ModuleList(
    (0): Embedding(3, 2)
    (1): Embedding(20, 10)
    (2): Embedding(3007, 50)
    (3): Embedding(48, 24)
    (4): Embedding(4, 2)
    (5): Embedding(6, 3)
    (6): Embedding(6, 3)
    (7): Embedding(15, 8)
    (8): Embedding(3, 2)
    (9): Embedding(10, 5)
    (10): Embedding(13, 7)
  )
  (embedding_dropout): Dropout(p=0.04, inplace=False)
  (fc1): Linear(in_features=78, out_features=1000, bias=True)
  (fc2): BatchNorm1d(1000, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc3): Dropout(p=0.04, inplace=False)
  (fc4): Linear(in_features=1000, out_features=256, bias=True)
  (fc5): BatchNorm1d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc6): Dropout(p=0.04, inplace=False)
  (fc7): Linear(in_features=256, out_features=128, bias=True)
  (fc8): BatchNorm1d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc9): Dropout(p=0.04, inplace=False)
  (fc10): Linear(in_features=128, out_features=32, bias=True)
  (fc11): BatchNorm1d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc12): Dropout(p=0.04, inplace=False)
  (fc13): Linear(in_features=32, out_features=2, bias=True)
)

I’m not sure where I’ve gone wrong.

It seems x_categorical is a FloatTensor instead of a LongTensor.
You could fix this via x_categorical = x_categorical.long().
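For example, a minimal sketch of the fix (made-up sizes):

import torch
import torch.nn as nn

emb = nn.Embedding(10, 4)                  # 10 categories, embedding dim 4
idx = torch.tensor([[1., 2.], [3., 4.]])   # float indices raise your exact error

out = emb(idx.long())                      # cast the indices, not the output
print(out.shape)                           # torch.Size([2, 2, 4])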

So I’m still getting the Long error even after casting the categorical data to long.

Note that in this line of code you are casting the output of the embedding layer:

e(x_categorical[:,i]).type(torch.LongTensor)

while it is the input that is expected to be a LongTensor. Could this be the error?
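In other words, schematically:

# wrong: casts the embedding *output*; the lookup itself still sees float indices
embeddings.append(e(x_categorical[:, i]).type(torch.LongTensor))

# right: cast the indices before the lookup; the output should stay float anyway
embeddings.append(e(x_categorical[:, i].long()))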

I took that out. Even before that, I had the following lines in my loop casting x_categorical to a long tensor:

def tab_run(train_predictions, test_predictions):
    for epoch in range(epochs):
        for label, policy, categorical_data, numerical_data in train_loader_tab:
            # move data to GPU
            label = label.long()
            label = label.to(device)
            categorical_data = categorical_data.long()
            categorical_data = categorical_data.to(device)
            numerical_data = numerical_data.to(device)
            train_predictions = train_predictions.to(device)
            # print(categorical_data.size(), label.size())
            # zero the parameter gradients
            optimizer.zero_grad()

            # Forward pass
            outputs = tab_model(numerical_data, categorical_data, train_predictions)
            loss = criterion(outputs, label)
            print(f"tab epoch: {epoch}, tab loss: {loss}")
            # Backward and optimize
            loss.backward()
            optimizer.step()

        for label, policy, categorical_data, numerical_data in test_loader_tab:
            # move data to GPU
            label = label.to(device)
            policy = policy.to(device)
            categorical_data = categorical_data.to(device)
            numerical_data = numerical_data.to(device)
            test_predictions = test_predictions.to(device)

            outputs = tab_model(numerical_data, categorical_data, test_predictions)
            loss = criterion(outputs, label)
            test_loss.append(loss.item())

        #         print(f"test epoch: {epoch}, test loss: {loss}")

        dt = datetime.now() - t0
        print('Duration:', dt)
        
tab_run(train_predictions = train_tensor, test_predictions = test_tensor)

Here is the error it gives after that:

---------------------------------------------------------------------------
RuntimeError                              Traceback (most recent call last)
<ipython-input-62-d89c1efcb9b3> in <module>
     39         print('Duration:', dt)
     40 
---> 41 tab_run(train_predictions = train_tensor, test_predictions = test_tensor)

<ipython-input-62-d89c1efcb9b3> in tab_run(train_predictions, test_predictions)
     14 
     15             # Forward pass
---> 16             outputs = tab_model(numerical_data, categorical_data, train_predictions)
     17             loss = criterion(outputs, label)
     18             print(f"tab epoch: {epoch}, tab loss: {loss}")

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\module.py in __call__(self, *input, **kwargs)
    530             result = self._slow_forward(*input, **kwargs)
    531         else:
--> 532             result = self.forward(*input, **kwargs)
    533         for hook in self._forward_hooks.values():
    534             hook_result = hook(self, input, result)

<ipython-input-55-1bdc8b23721e> in forward(self, x_categorical, x_numerical, predictions)
     35         embeddings = []
     36         for i, e in enumerate(self.all_embeddings):
---> 37             embeddings.append(e(x_categorical[:,i]))
     38 
     39         cat_embedd = torch.cat(embeddings, 1)

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\module.py in __call__(self, *input, **kwargs)
    530             result = self._slow_forward(*input, **kwargs)
    531         else:
--> 532             result = self.forward(*input, **kwargs)
    533         for hook in self._forward_hooks.values():
    534             hook_result = hook(self, input, result)

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\sparse.py in forward(self, input)
    112         return F.embedding(
    113             input, self.weight, self.padding_idx, self.max_norm,
--> 114             self.norm_type, self.scale_grad_by_freq, self.sparse)
    115 
    116     def extra_repr(self):

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\functional.py in embedding(input, weight, padding_idx, max_norm, norm_type, scale_grad_by_freq, sparse)
   1482         # remove once script supports set_grad_enabled
   1483         _no_grad_embedding_renorm_(weight, input, max_norm, norm_type)
-> 1484     return torch.embedding(weight, input, padding_idx, scale_grad_by_freq, sparse)
   1485 
   1486 

RuntimeError: Expected tensor for argument #1 'indices' to have scalar type Long; but got torch.cuda.FloatTensor instead (while checking arguments for embedding)

Could you post an executable code snippet using random inputs, which recreates this issue, so that we could debug it, please?
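For reference, something minimal along these lines (all shapes made up here; adjust them to your setup) would already help:

import torch

# (num_categories, emb_dim) pairs chosen so the concatenated width
# matches fc1's in_features of 78: (2 + 10) + 64 + 2 = 78
embedding_size = [(3, 2), (20, 10)]
model = Data_Only_Model(embedding_size)

x_cat = torch.rand(8, 2) * 3     # deliberately float to reproduce the dtype error
x_num = torch.randn(8, 64)
preds = torch.randn(8, 2)

# model(x_cat, x_num, preds)                # raises the Long-vs-Float RuntimeError
out = model(x_cat.long(), x_num, preds)     # casting the indices makes it run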

I think I may have it! I am now getting a different error when trying to concatenate a tensor of size [431, 2] with my categorical and numerical data. The tensor consists of predictions from two image models that I want to concatenate with the tabular data. The error is:

---------------------------------------------------------------------------
RuntimeError                              Traceback (most recent call last)
<ipython-input-243-186b3ea7dfcf> in <module>
     39         print('Duration:', dt)
     40 
---> 41 tab_run(train_predictions = train_tensor, test_predictions = test_tensor)

<ipython-input-243-186b3ea7dfcf> in tab_run(train_predictions, test_predictions)
     14 
     15             # Forward pass
---> 16             outputs = tab_model(categorical_data, numerical_data, train_predictions)
     17             loss = criterion(outputs, label)
     18             print(f"tab epoch: {epoch}, tab loss: {loss}")

~\AppData\Local\Continuum\anaconda3\envs\torch_env\lib\site-packages\torch\nn\modules\module.py in __call__(self, *input, **kwargs)
    530             result = self._slow_forward(*input, **kwargs)
    531         else:
--> 532             result = self.forward(*input, **kwargs)
    533         for hook in self._forward_hooks.values():
    534             hook_result = hook(self, input, result)

<ipython-input-241-49f06acf2d93> in forward(self, x_categorical, x_numerical, predictions)
     45 #         x = x.float()
     46         print('1 concat', x.size())
---> 47         x4 = torch.cat((x, predictions), dim = 1)
     48         print('X4', x4.size())
     49 

RuntimeError: invalid argument 0: Sizes of tensors must match except in dimension 1. Got 431 and 1 in dimension 0 at C:/w/1/s/tmp_conda_3.7_100118/conda/conda-bld/pytorch_1579082551706/work/aten/src\THC/generic/THCTensorMath.cu:71

These prediction tensors come from outside the data loader. I’m not sure if that matters.

def tab_run(train_predictions, test_predictions):
    train_predictions = train_predictions.to(device)
    test_predictions = test_predictions.to(device)
    for epoch in range(epochs):
        for label, policy, categorical_data, numerical_data in train_loader_tab:
            # move data to GPU
            label = label.long()
            label = label.to(device)
            categorical_data = categorical_data.long()
            categorical_data = categorical_data.to(device)
            numerical_data = numerical_data.to(device)

            # zero the parameter gradients
            optimizer.zero_grad()

            # Forward pass
            outputs = tab_model(categorical_data, numerical_data, train_predictions)  # use the parameter already moved to the device
            loss = criterion(outputs, label)
            print(f"tab epoch: {epoch}, tab loss: {loss}")
            # Backward and optimize
            loss.backward()
            optimizer.step()

        for label, policy, categorical_data, numerical_data in test_loader_tab:
            # move data to GPU
            label = label.to(device)
            policy = policy.to(device)
            categorical_data = categorical_data.to(device)
            numerical_data = numerical_data.to(device)
            # predictions come in here

            outputs = tab_model(categorical_data, numerical_data, test_predictions)
            loss = criterion(outputs, label)
            test_loss.append(loss.item())

        #         print(f"test epoch: {epoch}, test loss: {loss}")

        dt = datetime.now() - t0
        print('Duration:', dt)
        
tab_run(train_predictions = train_tensor, test_predictions = test_tensor)

To concatenate two tensors along a specific dimension, the sizes of all other dimensions must match.
In your case dim0 differs, with sizes 431 and 1, respectively.
I’m not sure how these tensors are used, but dim0 is usually the batch dimension, and I would expect it to have the same size in both tensors.
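For illustration (made-up shapes):

import torch

a = torch.randn(431, 76)                # batch of concatenated tabular features
b = torch.randn(431, 2)                 # predictions with a matching dim0

print(torch.cat((a, b), dim=1).shape)   # torch.Size([431, 78]) -- works

c = torch.randn(1, 2)
# torch.cat((a, c), dim=1)              # RuntimeError: 431 vs 1 in dimension 0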