-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathdata_loader.py
More file actions
104 lines (96 loc) · 3.92 KB
/
data_loader.py
File metadata and controls
104 lines (96 loc) · 3.92 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
import os
import torch
import torchvision
import torchvision.transforms as transforms
import torchvision.datasets as datasets
from dataset import KMNIST49
def load_dataset(data_root, dataset_name, img_size, only_train=True, trans=None):
if dataset_name == 'mnist':
train_dataset = torchvision.datasets.MNIST(
root=data_root,
train=True,
download=True,
transform=transforms.Compose([
transforms.Resize((img_size, img_size)),
transforms.ToTensor(),
transforms.Normalize((0.5,), (0.5,)),
]))
test_dataset = torchvision.datasets.MNIST(
root=data_root,
train=False,
download=True,
transform=transforms.Compose([
transforms.Resize((img_size, img_size)),
transforms.ToTensor(),
transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),
]))
elif dataset_name == 'kmnist49':
train_dataset = KMNIST49(
root=data_root,
train=True,
download=True
)
test_dataset = KMNIST49(
root=data_root,
train=False,
download=True
)
elif dataset_name == 'cifar10':
train_dataset = torchvision.datasets.CIFAR10(
root=data_root,
train=True,
transform=transforms.Compose([
transforms.Resize((img_size, img_size)),
transforms.ToTensor(),
transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),
]),
download=True
)
test_dataset = torchvision.datasets.CIFAR10(
root=data_root,
train=False,
transform=transforms.Compose([
transforms.Resize((img_size, img_size)),
transforms.ToTensor(),
transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),
]),
download=True
)
else:
if not only_train:
train_root = os.path.join(data_root, dataset_name, 'train')
else:
train_root = os.path.join(data_root, dataset_name)
train_dataset = datasets.ImageFolder(
# root=os.path.join(data_root, dataset_name, 'train'),
root=train_root,
transform=transforms.Compose([
transforms.Resize((img_size, img_size)),
transforms.ToTensor(),
transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5)),
])
)
test_dataset = datasets.ImageFolder(
root=os.path.join(data_root, dataset_name, 'test'),
transform=trans) if not only_train else None
return train_dataset, test_dataset
class DataLoader(object):
def __init__(self, data_root, dataset_name, img_size, batch_size, with_label):
self.data_root = data_root
self.dataset_name = dataset_name
self.img_size = img_size
self.batch_size = batch_size
self.with_label = with_label
def get_loader(self, only_train=False, trans=None):
train_dataset, test_dataset = load_dataset(
self.data_root, self.dataset_name, self.img_size, only_train, trans)
train_loader = torch.utils.data.DataLoader(
train_dataset, batch_size=self.batch_size, shuffle=True, num_workers=4)
test_loader = torch.utils.data.DataLoader(
test_dataset, batch_size=self.batch_size, shuffle=True, num_workers=4) if not only_train else None
print(f'Total number of train data: {len(train_loader.dataset)}')
if not only_train:
print(f'Total number of test data: {len(test_loader.dataset)}')
if self.with_label:
print(f'Total number of classes: {len(train_dataset.classes)}\n')
return train_loader, test_loader