2020-01-24 14:32:37 -05:00
|
|
|
""" Dataset definition.
|
|
|
|
|
|
|
|
MNIST / CIFAR10
|
|
|
|
"""
|
2019-11-13 11:45:05 -05:00
|
|
|
import torch
|
|
|
|
from torch.utils.data import SubsetRandomSampler
|
|
|
|
import torchvision
|
|
|
|
|
2020-01-24 15:10:08 -05:00
|
|
|
#Train/Validation batch size.
|
2019-11-13 11:45:05 -05:00
|
|
|
BATCH_SIZE: int = 300  # batch_size passed to the dl_train and dl_val loaders
|
2020-01-24 15:10:08 -05:00
|
|
|
#Test batch size.
|
|
|
|
TEST_SIZE: int = BATCH_SIZE  # batch_size passed to dl_test; kept equal to BATCH_SIZE
|
2020-01-17 15:12:28 -05:00
|
|
|
#TEST_SIZE = 10000 # slightly faster / higher memory consumption!
|
2019-11-13 11:45:05 -05:00
|
|
|
|
2020-01-24 15:10:08 -05:00
|
|
|
# Whether to download the data.
|
2020-01-20 11:05:40 -05:00
|
|
|
download_data: bool = False  # forwarded as download= to the CIFAR10 dataset constructors
|
2020-01-24 15:10:08 -05:00
|
|
|
# Number of workers to use for data loading.
|
2020-01-20 17:09:31 -05:00
|
|
|
num_workers: int = 2  # 4 is noted as an alternative value
|
2020-01-24 15:10:08 -05:00
|
|
|
# Whether the DataLoaders copy batches into pinned (page-locked) memory.
|
2020-01-20 11:05:40 -05:00
|
|
|
pin_memory: bool = False  # True: more GPU memory / slower
|
|
|
|
|
2019-11-13 11:45:05 -05:00
|
|
|
# WARNING: Dataug (Kornia) expects images in the range [0, 1].
|
|
|
|
#transform_train = torchvision.transforms.Compose([
|
|
|
|
# torchvision.transforms.RandomHorizontalFlip(),
|
|
|
|
# torchvision.transforms.ToTensor(),
|
2020-01-20 17:09:31 -05:00
|
|
|
# torchvision.transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)), #CIFAR10
|
2019-11-13 11:45:05 -05:00
|
|
|
#])
|
|
|
|
# Preprocessing applied to the validation and test datasets: the only active
# step converts each sample to a tensor. Normalization is kept below as a
# disabled option (CIFAR10 channel statistics).
transform = torchvision.transforms.Compose([
    torchvision.transforms.ToTensor(),
    # torchvision.transforms.Normalize((0.4914, 0.4822, 0.4465), (0.2023, 0.1994, 0.2010)), #CIFAR10
])
|
2020-01-20 17:09:31 -05:00
|
|
|
|
2020-01-31 10:34:44 -05:00
|
|
|
# Preprocessing applied to the training dataset: the only active step converts
# each sample to a tensor. The random flips are kept below as disabled options.
transform_train = torchvision.transforms.Compose([
    #transforms.RandomHorizontalFlip(),
    #transforms.RandomVerticalFlip(),
    torchvision.transforms.ToTensor(),
])
|
2020-01-31 10:36:50 -05:00
|
|
|
#from RandAugment import RandAugment
|
|
|
|
# Add RandAugment with N, M (hyperparameters)
|
2020-01-31 10:34:44 -05:00
|
|
|
#transform_train.transforms.insert(0, RandAugment(n=2, m=30))
|
2020-01-20 17:09:31 -05:00
|
|
|
|
2019-12-04 12:28:32 -05:00
|
|
|
### Classic Dataset ###
|
2020-01-31 10:34:44 -05:00
|
|
|
#MNIST
|
|
|
|
#data_train = torchvision.datasets.MNIST("../data", train=True, download=True, transform=transform_train)
|
|
|
|
#data_val = torchvision.datasets.MNIST("../data", train=True, download=True, transform=transform)
|
|
|
|
#data_test = torchvision.datasets.MNIST("../data", train=False, download=True, transform=transform)
|
|
|
|
#CIFAR
|
|
|
|
# CIFAR10 training split read from ../data, preprocessed with transform_train.
data_train = torchvision.datasets.CIFAR10(
    root="../data",
    train=True,
    transform=transform_train,
    download=download_data,
)
|
|
|
|
# Validation data: the same CIFAR10 training split (train=True) read from
# ../data, but preprocessed with the evaluation transform.
data_val = torchvision.datasets.CIFAR10(
    root="../data",
    train=True,
    transform=transform,
    download=download_data,
)
|
2020-01-24 14:32:37 -05:00
|
|
|
# CIFAR10 test split (train=False) read from ../data, preprocessed with the
# evaluation transform.
data_test = torchvision.datasets.CIFAR10(
    root="../data",
    train=False,
    transform=transform,
    download=download_data,
)
|
2019-12-04 12:28:32 -05:00
|
|
|
|
2019-11-20 16:06:27 -05:00
|
|
|
# Indices of the first half of data_train, used for training.
train_subset_indices = range(len(data_train) // 2)
|
2019-11-13 11:45:05 -05:00
|
|
|
# Indices of the second half of data_train, used for validation.
val_subset_indices = range(len(data_train) // 2, len(data_train))
|
2019-11-21 12:29:17 -05:00
|
|
|
#train_subset_indices=range(BATCH_SIZE*10)
|
|
|
|
#val_subset_indices=range(BATCH_SIZE*10, BATCH_SIZE*20)
|
2019-12-04 12:28:32 -05:00
|
|
|
|
2020-01-24 11:50:30 -05:00
|
|
|
# Training loader: batches of BATCH_SIZE samples drawn from data_train,
# restricted to train_subset_indices.
dl_train = torch.utils.data.DataLoader(
    data_train,
    batch_size=BATCH_SIZE,
    shuffle=False,  # sample selection is delegated to the sampler below
    sampler=SubsetRandomSampler(train_subset_indices),
    num_workers=num_workers,
    pin_memory=pin_memory,
)
|
2020-01-31 10:34:44 -05:00
|
|
|
# Validation loader: batches of BATCH_SIZE samples drawn from data_val,
# restricted to val_subset_indices.
dl_val = torch.utils.data.DataLoader(
    data_val,
    batch_size=BATCH_SIZE,
    shuffle=False,  # sample selection is delegated to the sampler below
    sampler=SubsetRandomSampler(val_subset_indices),
    num_workers=num_workers,
    pin_memory=pin_memory,
)
|
2020-01-10 13:21:34 -05:00
|
|
|
# Test loader: iterates over all of data_test in batches of TEST_SIZE,
# without shuffling and without a sampler.
dl_test = torch.utils.data.DataLoader(
    data_test,
    batch_size=TEST_SIZE,
    shuffle=False,
    num_workers=num_workers,
    pin_memory=pin_memory,
)
|