-
Notifications
You must be signed in to change notification settings - Fork 0
/
preprocess_data.py
31 lines (23 loc) · 851 Bytes
/
preprocess_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import numpy as np
from tqdm import tqdm
## LOADING DATA
# Path and file names. The processed arrays are saved back to these same
# files at the end of the script, replacing the raw inputs.
dir_path = './Data/'
img_file_name = 'train_images.npy'
labels_file_name = 'train_labels.npy'

print("Loading our dataset...")
# Loading our model data.
# NOTE(review): allow_pickle=True lets np.load unpickle arbitrary objects, so
# these files must come from a trusted source.
images = np.load(dir_path + img_file_name, allow_pickle=True)
labels = np.load(dir_path + labels_file_name, allow_pickle=True)

# images[0] is used below to size the output buffer; fail with a clear
# message instead of a bare IndexError when the dataset is empty.
if len(images) == 0:
    raise ValueError("No images found in " + dir_path + img_file_name)

print("Preprocess start...")
# Pre-allocate a single array shaped (number of images,) + shape of the first
# image, then copy every image into its slot.
# NOTE(review): int8 only holds -128..127. If the stored images are 0..255
# pixel data, values above 127 would be silently wrapped by the copy below --
# confirm that int8 (rather than uint8) is intended.
stack_imgs = np.empty((len(images),) + images[0].shape, dtype='int8')

print("Stacking image data.")
for i, arr in enumerate(tqdm(images)):
    stack_imgs[i] = arr

print("processing labels data.")
# Convert the loaded labels into a plain integer array.
new_lbls = np.array(labels, dtype='int')

print("Stacking done. Statistics:-")
print("Image data shape: ", stack_imgs.shape)
print("Labels array shape: ", new_lbls.shape)

# Overwrite the original files with the stacked / converted arrays.
np.save(dir_path + img_file_name, stack_imgs)
np.save(dir_path + labels_file_name, new_lbls)