Albumentations transforms cannot differentiate between train and validation transforms

Atia · March 17, 2022, 11:47am

Hello, I have created a data pipeline that builds train, validation and test sets with various augmentations using albumentations, with the code below:

class GetDataset(Dataset):
    """Image dataset backed by a DataFrame of file names and optional labels.

    Args:
        imgDir: Directory that contains the image files.
        dataset: DataFrame with an ``'image'`` column of file names and, when
            ``labeled`` is true, an ``'individual_label'`` column.
        transform: Optional callable invoked as ``transform(image=array)`` that
            returns a mapping with an ``'image'`` entry. When ``None`` the
            decoded RGB image is used unchanged.
        labeled: When true, ``__getitem__`` returns ``(image, target)``;
            otherwise it returns only the image tensor.
    """

    def __init__(self,imgDir: str,dataset: pd.DataFrame,transform=None,labeled=True):
        self.imgDir = imgDir
        self.dataset = dataset
        self.labeled = labeled
        self.transform = transform

    def __len__(self) -> int:
        """Return the number of rows in the backing DataFrame."""
        return len(self.dataset)

    @staticmethod
    def _to_chw_tensor(image):
        """Convert an (H, W, C) array into a float32 (C, H, W) tensor."""
        # (2, 0, 1) moves channels first while keeping rows before columns.
        # The previous (2, 1, 0) order also swapped height and width, which
        # transposed every image that came out of the dataset.
        return torch.tensor(image.astype(np.float32).transpose(2, 0, 1))

    def __getitem__(self,idx: int) -> tuple:
        """Load, transform and return the sample at position ``idx``.

        Returns:
            ``(image, target)`` when the dataset is labeled, otherwise just
            the image tensor. The image is float32 in (C, H, W) layout.

        Raises:
            FileNotFoundError: If the image file cannot be read.
        """
        img_path = os.path.join(self.imgDir,self.dataset['image'].iloc[idx])
        image = cv2.imread(img_path)
        if image is None:
            # cv2.imread signals failure by returning None instead of raising.
            raise FileNotFoundError(f"Could not read image: {img_path}")
        image = cv2.cvtColor(image,cv2.COLOR_BGR2RGB) # may change to GrayScale.
        if self.transform is not None:
            image = self.transform(image=image)['image']
        # Convert outside the branch so a dataset without a transform still
        # yields a tensor instead of implicitly returning None.
        image = self._to_chw_tensor(image)
        if not self.labeled:
            return image
        target = torch.tensor(self.dataset['individual_label'].iloc[idx])
        return image,target
        
def transform_ds(trainFlag=True):
    """Build the albumentations pipeline for training or evaluation.

    Both pipelines resize to 224x224 first and normalize last. When
    ``trainFlag`` is truthy, random flips, 90-degree rotations, Gaussian blur
    and color jitter are inserted between those two steps.
    """
    resize = A.Resize(224,224)
    normalize = A.Normalize(mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225))

    if not trainFlag:
        # Evaluation: deterministic resize + normalize only.
        return A.Compose([resize, normalize])

    augmentations = [
        # spatial transforms
        A.HorizontalFlip(p=0.5),
        A.VerticalFlip(p=0.5),
        A.RandomRotate90(p=0.5),
        # pixel-wise transforms
        A.GaussianBlur(blur_limit=(3,3),p=0.2),
        A.ColorJitter(0.45,0.45,0.45,0.45),
    ]
    return A.Compose([resize, *augmentations, normalize])

I then use the code below to create my train, validation and test datasets:

# Two views over the same DataFrame: augmented for training, plain for validation.
tex = GetDataset(train_imgs, df_copy, transform=transform_ds(trainFlag=True))
vex = GetDataset(train_imgs, df_copy, transform=transform_ds(trainFlag=False))

# Unlabeled test set, using the evaluation transforms.
tester = GetDataset(test_imgs, test_copy, labeled=False, transform=transform_ds(trainFlag=False))

# Random split: the last 1000 shuffled indices are held out for validation.
indices = torch.randperm(len(df_copy)).tolist()
train_idx, val_idx = indices[:-1000], indices[-1000:]
train_eg = torch.utils.data.Subset(tex, train_idx)
val_eg = torch.utils.data.Subset(vex, val_idx)

ex_t = DataLoader(train_eg, batch_size=16, shuffle=True)
ex_v = DataLoader(val_eg, batch_size=16, shuffle=True)
test = DataLoader(tester, batch_size=16)

But when I try to visualize them, I find that my validation set appears to use the same augmentations as my train set, even though I am explicitly using the trainFlag to control which transforms are applied to which dataset. I noticed that this problem only occurs when I use transforms from albumentations; the code works as expected when I use torchvision transforms.

ptrblck · March 18, 2022, 6:36am

Your code works for me using albumentations as seen here:

class GetDataset(Dataset):
    """Toy dataset of ten constant 224x224x3 uint8 images for checking transforms."""

    def __init__(self, transform=None):
        self.transform = transform
        # Ten all-ones images, allocated directly as uint8.
        self.data = np.ones((10, 224, 224, 3), dtype=np.uint8)

    def __len__(self):
        return self.data.shape[0]

    def __getitem__(self, index):
        # The transform is called albumentations-style with an `image` keyword
        # and its result is returned unchanged.
        sample = self.data[index]
        return self.transform(image=sample)
    
def transform_ds(trainFlag=True):
    """Return a one-step albumentations pipeline selected by ``trainFlag``.

    A truthy flag gives always-on Gaussian noise; a falsy flag gives a
    Normalize step with mean and std of 1 per channel, so the two outputs
    are easy to tell apart.
    """
    if not trainFlag:
        step = albumentations.transforms.Normalize(mean=(1., 1., 1.), std=(1., 1., 1.))
    else:
        step = albumentations.transforms.GaussNoise(p=1.0)
    return albumentations.Compose([step])
    
# One dataset per pipeline so the two loaders can be compared directly.
train_dataset = GetDataset(transform=transform_ds(trainFlag=True))
val_dataset = GetDataset(transform=transform_ds(trainFlag=False))

# Shuffle the ten sample indices and give each subset half of them.
indices = torch.randperm(10).tolist()
first_half, second_half = indices[:5], indices[5:]
train_eg = torch.utils.data.Subset(train_dataset, first_half)
val_eg = torch.utils.data.Subset(val_dataset, second_half)

ex_t = DataLoader(train_eg, batch_size=5, shuffle=True)
ex_v = DataLoader(val_eg, batch_size=5, shuffle=True)

# Pull a single batch from each loader for inspection.
a = next(iter(ex_t))
b = next(iter(ex_v))

If you print a and b, you’ll see that different transformations are applied to each and that the trainFlag works properly.

Atia · March 18, 2022, 11:13am

Thank you for your response. I finally figured it out. I was not converting my images to tensors, and because of that the transforms were showing me the images in a certain orientation. That confused me into thinking the train transforms were being applied. I still think it's strange, though; I believe it has to do with how albumentations reads images (i.e. using OpenCV) as opposed to how PyTorch does it using PIL images. Thanks again.