python source code of h5

from __future__ import print_function

import h5py
import os
import numpy as np
import cv2
import argparse
import random
import itertools
from tqdm import tqdm, trange
from sklearn.utils import shuffle
from keras.preprocessing.image import ImageDataGenerator

# Save current python dir path
dir_path = os.path.dirname(os.path.realpath('__file__'))

parser = argparse.ArgumentParser()
parser.add_argument("--path", help="path of leftImg8bit folder.", default='/run/media/tkwoo/myWorkspace/workspace/01.dataset/cityscape/leftImg8bit')
parser.add_argument("--gtpath", help="path of gtFine folder.", default='/run/media/tkwoo/myWorkspace/workspace/01.dataset/cityscape/gtFine')

args = parser.parse_args()
img_folder_path = args.path
gt_folder_path = args.gtpath

# Use only 3 classes.
labels = ['background', 'person', 'car', 'road']

def get_data(mode):
    if mode == 'train' or mode == 'val' or mode == 'test':
        x_paths = []
        y_paths = []
        tmp_img_folder_path = os.path.join(img_folder_path, mode)
        tmp_gt_folder_path = os.path.join(gt_folder_path, mode)

        # os.walk helps to find all files in directory.
        for (path, dirname, files) in sorted(os.walk(tmp_img_folder_path)):
            for filename in sorted(files):
                x_paths.append(os.path.join(path, filename))

        # Find ground_truth file paths with x_paths.
        idx = len(tmp_img_folder_path)
        for x_path in x_paths:
            y_paths.append(tmp_gt_folder_path + x_path[idx:-15] + 'gtFine_labelIds.png')

        return x_paths, y_paths
    else:
        print("Please call get_data function with arg 'train', 'val', 'test'.")

def write_data(h5py_file, mode, x_paths, y_paths):
    num_data = len(x_paths)

    uint8_dt = h5py.special_dtype(vlen=np.uint8)
    string_dt = h5py.special_dtype(vlen=str)

    group = h5py_file.create_group(mode)
    h5_name = group.create_dataset('name', shape=(num_data,), dtype=string_dt)
    h5_image = group.create_dataset('image', shape=(num_data,), dtype=uint8_dt)
    h5_label = group.create_dataset('label', shape=(num_data,), dtype=uint8_dt)

    h5_image.attrs['size'] = [256,512,3]
    h5_label.attrs['size'] = [256,512,1]

    for i in range(num_data):
        x_img = cv2.imread(x_paths[i], 1)
        y_img = cv2.imread(y_paths[i], 0)
        x_img = cv2.resize(x_img, None, fx=0.25, fy=0.25, interpolation=cv2.INTER_LINEAR)
        y_img = cv2.resize(y_img, None, fx=0.25, fy=0.25, interpolation=cv2.INTER_NEAREST)

        h5_image[i] = x_img.flatten()
        h5_label[i] = y_img.flatten()
        h5_name[i] = os.path.basename(x_paths[i])

        # break

def make_h5py():
    x_train_paths, y_train_paths = get_data('train')
    x_val_paths, y_val_paths = get_data('val')
    x_test_paths, y_test_paths = get_data('test')

    h5py_file = h5py.File(os.path.join(dir_path, 'data.h5'), 'w')
    
    start = cv2.getTickCount()
    write_data(h5py_file, 'train', x_train_paths, y_train_paths)
    time = (cv2.getTickCount()-start)/cv2.getTickFrequency()
    print ('parsing train data, Time:%.3fs'%time)

    start = cv2.getTickCount()
    write_data(h5py_file, 'val', x_val_paths, y_val_paths)
    time = (cv2.getTickCount()-start)/cv2.getTickFrequency()
    print ('parsing val data, Time:%.3fs'%time)

    start = cv2.getTickCount()
    write_data(h5py_file, 'test', x_test_paths, y_test_paths)
    time = (cv2.getTickCount()-start)/cv2.getTickFrequency()
    print ('parsing test data, Time:%.3fs'%time)

def read_h5py_example():
    h5_in = h5py.File(os.path.join(dir_path, 'data.h5'), 'r')
    print (h5_in.keys())
    print (h5_in['train']['image'].dtype)
    print (h5_in['train']['image'][0].shape)

    image_size = h5_in['train']['image'].attrs['size']
    label_size = h5_in['train']['label'].attrs['size']

    x_img = np.reshape(h5_in['train']['image'][0], tuple(image_size))
    y_img = np.reshape(h5_in['train']['label'][0], tuple(label_size))
    name = h5_in['train']['name'][0]
    print (name)
    y_img = (y_img.astype(np.float32)*255/33).astype(np.uint8)
    y_show = cv2.applyColorMap(y_img, cv2.COLORMAP_JET)
    show = cv2.addWeighted(x_img, 0.5, y_show, 0.5, 0)
    cv2.imshow("show", show)
    cv2.waitKey()

def h5py_test():
    h5_in = h5py.File(os.path.join(dir_path, 'cityscape.h5'), 'r')
    h5_name = h5_in['train']['name'] #.get('/train/name')
    h5_image = h5_in['train']['image'] #.get('/train/image')
    h5_label = h5_in['train']['label'] #.get('/train/label')

    shuffle_indexes = np.array(shuffle(range(len(h5_image))))

    batch_size = 32

    print (len(h5_image))
    print (len(shuffle_indexes))
    print (len(shuffle_indexes)//batch_size)

    image_size = h5_in['train']['image'].attrs['size']
    label_size = h5_in['train']['label'].attrs['size']

    # reshape_image_size = tuple(np.insert(image_size, 0, len(h5_image)))
    # reshape_label_size = tuple(np.insert(label_size, 0, len(h5_label)))

    # print(h5_image[0:10].astype(type(h5_image[0])).dtype)
    
    print (h5_image[:10])
    print ('shape:',h5_image[:10].shape)
    print ('dtype:',h5_image[:10].dtype)
    print ('type of element:',type(h5_image[:10][0]))
    
    # for idx in range(len(shuffle_indexes)//batch_size):
    #     x_img = np.array(h5_image[shuffle_indexes[idx:idx+batch_size]].tolist())

    exit()

    # faster than reading image files
    x_img = np.array(h5_image[:].tolist())
    y_img = np.array(h5_label[:].tolist())

    print (x_img.shape)

    x_img = np.reshape(x_img, reshape_image_size)
    y_img = np.reshape(y_img, reshape_label_size)

    datagen_args = dict(
                featurewise_center=False,  # set input mean to 0 over the dataset
                samplewise_center=False,  # set each sample mean to 0
                featurewise_std_normalization=False,  # divide inputs by std of the dataset
                samplewise_std_normalization=False,  # divide each input by its std
                zca_whitening=False,  # apply ZCA whitening
                rotation_range=10,  # randomly rotate images in the range (degrees, 0 to 180)
                width_shift_range=0.1,  # randomly shift images horizontally (fraction of total width)
                height_shift_range=0.1,  # randomly shift images vertically (fraction of total height)
                fill_mode='constant',
                # cval=0.,
                horizontal_flip=False,  # randomly flip images
                vertical_flip=False)  # randomly flip images

    image_datagen = ImageDataGenerator(**datagen_args)
    mask_datagen = ImageDataGenerator(**datagen_args)

    x_img = x_img.astype(np.float32)
    y_img = y_img.astype(np.float32)

    seed = random.randrange(1, 1000)
    # image_datagen.fit(np_x, augment=True, seed=seed)
    # mask_datagen.fit(np_y, augment=True, seed=seed)
    start = cv2.getTickCount()
    img_gen = image_datagen.flow(x_img, batch_size=32, shuffle=True, seed=seed)
    mask_gen = mask_datagen.flow(y_img, batch_size=32, shuffle=True, seed=seed)
    time = (cv2.getTickCount() - start) / cv2.getTickFrequency() * 1000
    print ('flow time : %.2f ms'%time)
    
    start = cv2.getTickCount()

    for img, label in itertools.izip(img_gen, mask_gen):
        
        img = img.astype(np.uint8)
        label = label.astype(np.uint8)
        cv2.imshow('temp', img[0])
        cv2.imshow('label', label[0])
        key = cv2.waitKey(1)
        if key == 27:
            break
        time = (cv2.getTickCount() - start) / cv2.getTickFrequency() * 1000
        print ('read time : %.2f ms'%time)
    exit()

    # x_img = x_img[0]
    # y_img = y_img[0]

    # y_img = (y_img.astype(np.float32)*255/33).astype(np.uint8)
    # y_show = cv2.applyColorMap(y_img, cv2.COLORMAP_JET)
    # show = cv2.addWeighted(x_img, 0.5, y_show, 0.5, 0)
    # cv2.imshow("show", show)
    # cv2.waitKey()
    # # print (h5_image.shape)
    # # print (type(h5_image))
    # # print (type(h5_image[0]))

def image_copy_to_dir(mode, x_paths, y_paths):
    target_path = '/run/media/tkwoo/myWorkspace/workspace/01.dataset/03.Mask_data/cityscape'
    target_path = os.path.join(target_path, mode)

    for idx in trange(len(x_paths)):
        image = cv2.imread(x_paths[idx], 1)
        mask = cv2.imread(y_paths[idx], 0)

        image = cv2.resize(image, None, fx=0.25, fy=0.25, interpolation=cv2.INTER_LINEAR)
        mask = cv2.resize(mask, None, fx=0.25, fy=0.25, interpolation=cv2.INTER_NEAREST)

        cv2.imwrite(os.path.join(target_path, 'image', os.path.basename(x_paths[idx])), image)
        cv2.imwrite(os.path.join(target_path, 'mask', os.path.basename(y_paths[idx])), mask)

        # show = image.copy()
        # mask = (mask.astype(np.float32)*255/33).astype(np.uint8)
        # mask_color = cv2.applyColorMap(mask, cv2.COLORMAP_JET)
        # show = cv2.addWeighted(show, 0.5, mask_color, 0.5, 0.0)
        # cv2.imshow('show', show)
        # key = cv2.waitKey(1)
        # if key == 27:
        #     return

def image_collection():
    x_train_paths, y_train_paths = get_data('train')
    x_val_paths, y_val_paths = get_data('val')
    x_test_paths, y_test_paths = get_data('test')

    image_copy_to_dir('train', x_train_paths, y_train_paths)
    image_copy_to_dir('val', x_val_paths, y_val_paths)
    image_copy_to_dir('test', x_test_paths, y_test_paths)

if __name__=='__main__':
    # make_h5py() # cityscape -> 2.5GB h5 file
    # read_h5py_example()
    h5py_test()
    # image_collection()