in datasets/preprocessing.py [0:0]
def __init__(self,
             resize=(256, 256),
             crop=(224, 224),
             color=(0.4, 0.4, 0.4, 0.2),
             num_frames=8,
             pad_missing=False,
             augment=True,
             normalize=True,
             totensor=True,
             ):
    """Build the clip transform pipeline and store it on ``self.transform``.

    Args:
        resize: Forwarded to ``video_transforms.Resize``.
        crop: Forwarded to ``video_transforms.RandomCrop`` when ``augment``
            is true, otherwise to ``video_transforms.CenterCrop``.
        color: Unpacked positionally into ``video_transforms.ColorJitter``;
            only used when ``augment`` is true. Presumably
            (brightness, contrast, saturation, hue) -- TODO confirm against
            the ColorJitter signature.
        num_frames: Stored on ``self.num_frames``; not used in this method.
        pad_missing: Stored on ``self.pad_missing``; not used in this method.
        augment: Selects the random crop / horizontal flip / color jitter
            pipeline instead of the plain center-crop pipeline.
        normalize: Append ``tensor_transforms.Normalize`` with fixed
            per-channel mean/std. Requires ``totensor``.
        totensor: Append ``volume_transforms.ClipToTensor``.

    Raises:
        ValueError: If ``normalize`` is true while ``totensor`` is false.
    """
    # Explicit raise instead of ``assert``: assertions are removed under
    # ``python -O``, which would let an invalid pipeline through silently.
    if normalize and not totensor:
        raise ValueError("normalize=True requires totensor=True")

    self.resize = resize
    self.crop = crop
    self.augment = augment
    self.num_frames = num_frames
    self.pad_missing = pad_missing

    # Both pipelines start with the same resize step.
    transforms = [video_transforms.Resize(resize)]
    if augment:
        transforms += [
            video_transforms.RandomCrop(crop),
            video_transforms.RandomHorizontalFlip(),
            video_transforms.ColorJitter(*color),
        ]
    else:
        transforms.append(video_transforms.CenterCrop(crop))

    if totensor:
        transforms.append(volume_transforms.ClipToTensor())
    if normalize:
        # NOTE(review): these match the widely used ImageNet channel
        # statistics -- confirm that is the intended normalization.
        transforms.append(tensor_transforms.Normalize(
            mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]))

    self.transform = video_transforms.Compose(transforms)