forked from pbcquoc/crnn
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathloader.py
More file actions
133 lines (103 loc) · 3.87 KB
/
loader.py
File metadata and controls
133 lines (103 loc) · 3.87 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
import torchvision
import torch
import os
import torch.utils.data as data
from PIL import Image
import numpy as np
import argparse
import time
from multiprocessing import cpu_count
import uuid
from models.utils import resizePadding
def img_loader(path):
img = Image.open(path).convert('RGB')
return img
def train_transform(path):
pass
def test_transform(path):
pass
def target_loader(path):
label = open(path).read().rstrip('\n')
return label
def default_flist_reader(flist):
imlist = []
img_exts = ('jpg', 'png', 'JPG', 'PNG')
with open(flist) as rf:
for line in rf.readlines():
impath = line.strip()
if impath.endswith(img_exts):
imlabel = os.path.splitext(impath)[0] + '.txt'
imlist.append((impath, imlabel))
return imlist
class ImageFileList(data.Dataset):
def __init__(self, root, flist, transform, target_transform,
flist_reader=default_flist_reader):
self.root = root
self.imlist = flist_reader(flist)
self.transform = transform
self.target_transform = target_transform
def __getitem__(self, index):
impath, targetpath = self.imlist[index]
imgpath = os.path.join(self.root,impath)
targetpath = os.path.join(self.root,targetpath)
img = self.transform(imgpath)
target = self.target_transform(targetpath)
return img, target
def __len__(self):
return len(self.imlist)
class alignCollate(object):
def __init__(self, imgW, imgH):
self.imgH = imgH
self.imgW = imgW
def __call__(self, batch):
images, labels = zip(*batch)
imgH = self.imgH
imgW = self.imgW
images = [resizePadding(image, self.imgW, self.imgH) for image in images]
images = torch.cat([t.unsqueeze(0) for t in images], 0)
return images, labels
class DatasetLoader(object):
def __init__(self, root, train_file, test_file, imgW, imgH):
self.root = root
self.train_file = os.path.join(root, train_file)
self.test_file = os.path.join(root, test_file)
self.imgW = imgW
self.imgH = imgH
self.train_dataset = ImageFileList(root, self.train_file, transform=img_loader, target_transform=target_loader)
self.test_dataset = ImageFileList(root, self.test_file, transform=img_loader, target_transform=target_loader)
def train_loader(self, batch_size, num_workers=4, shuffle=True):
train_loader = torch.utils.data.DataLoader(
self.train_dataset,
batch_size=batch_size,
num_workers=num_workers,
shuffle=True,
collate_fn=alignCollate(self.imgW, self.imgH)
)
return train_loader
def test_loader(self, batch_size, num_workers=4, shuffle=True):
test_loader = torch.utils.data.DataLoader(
self.test_dataset,
batch_size=batch_size,
num_workers=num_workers,
shuffle=True,
collate_fn=alignCollate(self.imgW, self.imgH)
)
return test_loader
def main():
parser = argparse.ArgumentParser()
parser.add_argument('--root', required=True, help='path to root folder')
parser.add_argument('--train', required=True, help='path to train list')
parser.add_argument('--val', required=True, help='path to test list')
opt = parser.parse_args()
loader = DatasetLoader(opt.root, opt.train, opt.val, 512, 32)
for _ in range(100):
train_loader = iter(loader.train_loader(64, num_workers=cpu_count()))
i = 0
while i < len(train_loader):
start_time = time.time()
X_train, y_train = next(train_loader)
elapsed_time = time.time() - start_time
i += 1
print(i, elapsed_time, X_train.size())
if __name__ == '__main__':
main()