TensorFlow Dataloader
1. NumPy
'''
ModelNet dataset. Supports ModelNet40, ModelNet10, XYZ and normal channels. Up to 10,000 points.
'''
import os
import os.path
import json
import numpy as np
import sys
BASE_DIR = os.path.dirname(os.path.abspath(__file__))
ROOT_DIR = BASE_DIR
sys.path.append(os.path.join(ROOT_DIR, 'utils'))
import provider
from glob import glob
import re
from tqdm import tqdm
def pc_normalize(pc):
    # Center the cloud at the origin and scale it into the unit sphere.
    centroid = np.mean(pc, axis=0)
    pc = pc - centroid
    m = np.max(np.sqrt(np.sum(pc ** 2, axis=1)))
    pc = pc / m
    return pc
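A quick sanity check of pc_normalize on toy data (the random cloud below is just for illustration, not from the dataset): after normalization the farthest point lies exactly on the unit sphere.
pts = np.random.rand(128, 3) * 50.0  # arbitrary toy cloud
normed = pc_normalize(pts)
assert abs(np.max(np.linalg.norm(normed, axis=1)) - 1.0) < 1e-6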
class ModelNetDataset():
    def __init__(self, root, batch_size=32, npoints=1024, split='train',
                 normalize=False, normal_channel=False, modelnet10=True,
                 cache_size=15000, shuffle=None):
        self.root = root  # e.g. '/workspace/datasets/modelnet40_normal_resampled/'
self.batch_size = batch_size
self.npoints = npoints
self.normalize = normalize
self.normal_channel = normal_channel
        ### To be modified per dataset
        # Dataset 1: 'human' point clouds; train/test split by filename pattern
        self.cat = ['vehicle', 'bicycle', 'human']
        self.classes = dict(zip(self.cat, range(len(self.cat))))
        shape_ids = {}
        shape_ids['train'] = glob('./human_*.npy')
        shape_ids['test'] = glob('./human_2*.npy')
        shape_names = ['human' for _ in range(len(shape_ids[split]))]
        self.datapath1 = [(shape_names[i], shape_ids[split][i]) for i in range(len(shape_ids[split]))]
# Dataset 2
shape_ids2 = {}
        shape_ids2['train'] = glob('./pointnet3_dataset_object_*.npy')
shape_ids2['test'] = glob('./pointnet3_dataset_object_9*.npy')
        shape_names2 = []
        # One-hot label encodings stored in the companion label files
        vehicle = [1.0, 0.0, 0.0]
        bicycle = [0.0, 1.0, 0.0]
        human = [0.0, 0.0, 1.0]
        for i in tqdm(range(len(shape_ids2[split]))):
            fname = shape_ids2[split][i]
            # Escape '.' so '.npy' is matched literally, then pull out the object index
            arr_str = re.split(r'_|\.npy', fname)
            load_path = './pointnet3_dataset_label_{}.npy'.format(arr_str[5])
            label = np.load(load_path)
            if label.tolist() == vehicle:
                shape_names2.append('vehicle')
            elif label.tolist() == bicycle:
                shape_names2.append('bicycle')
            elif label.tolist() == human:
                shape_names2.append('human')
            else:
                print('error: unrecognized label in {}'.format(load_path))
self.datapath2 = [(shape_names2[i], shape_ids2[split][i]) for i in range(len(shape_ids2[split]))]
        self.datapath = np.vstack([np.array(self.datapath1), np.array(self.datapath2)])
self.cache_size = cache_size # how many data points to cache in memory
self.cache = {} # from index to (point_set, cls) tuple
if shuffle is None:
if split == 'train': self.shuffle = True
else: self.shuffle = False
else:
self.shuffle = shuffle
self.reset()
    def _augment_batch_data(self, batch_data):
        # Rotate, jitter, and shuffle (helpers from the PointNet provider module)
        rotated_data = provider.rotate_point_cloud(batch_data)
        jittered_data = provider.jitter_point_cloud(rotated_data[:, :, 0:3])
        rotated_data[:, :, 0:3] = jittered_data
        return provider.shuffle_points(rotated_data)
def _get_item(self, index):
if index in self.cache:
point_set, cls = self.cache[index]
else:
fn = self.datapath[index]
cls = self.classes[self.datapath[index][0]]
cls = np.array([cls]).astype(np.int32)
#point_set = np.loadtxt(fn[1],delimiter=',').astype(np.float32)
point_set = np.load(fn[1]).astype(np.float32)
# Take the first npoints
point_set = point_set[0:self.npoints,:]
if self.normalize:
point_set[:,0:3] = pc_normalize(point_set[:,0:3])
if not self.normal_channel:
point_set = point_set[:,0:3]
if len(self.cache) < self.cache_size:
self.cache[index] = (point_set, cls)
        # Zero-pad clouds that have fewer than npoints points ("upsampling" to npoints);
        # use the actual channel count so this also works when normals are kept
        full_point_set = np.zeros((self.npoints, point_set.shape[1]))
        full_point_set[0:point_set.shape[0], :] = point_set
        return full_point_set, cls
def __getitem__(self, index):
return self._get_item(index)
def __len__(self):
return len(self.datapath)
def num_channel(self):
if self.normal_channel:
return 6
else:
return 3
def reset(self):
self.idxs = np.arange(0, len(self.datapath))
if self.shuffle:
np.random.shuffle(self.idxs)
self.num_batches = (len(self.datapath)+self.batch_size-1) // self.batch_size
self.batch_idx = 0
def has_next_batch(self):
return self.batch_idx < self.num_batches
def next_batch(self, augment=False):
        ''' The last returned batch may be smaller than self.batch_size. '''
start_idx = self.batch_idx * self.batch_size
end_idx = min((self.batch_idx+1) * self.batch_size, len(self.datapath))
bsize = end_idx - start_idx
batch_data = np.zeros((bsize, self.npoints, self.num_channel()))
batch_label = np.zeros((bsize), dtype=np.int32)
for i in range(bsize):
ps,cls = self._get_item(self.idxs[i+start_idx])
batch_data[i] = ps
batch_label[i] = cls
self.batch_idx += 1
if augment: batch_data = self._augment_batch_data(batch_data)
return batch_data, batch_label
if __name__ == '__main__':
d = ModelNetDataset(root = '../data/modelnet40_normal_resampled', split='test')
print(d.shuffle)
print(len(d))
import time
tic = time.time()
for i in range(10):
ps, cls = d[i]
print(time.time() - tic)
print(ps.shape, type(ps), cls)
print(d.has_next_batch())
ps_batch, cls_batch = d.next_batch(True)
print(ps_batch.shape)
print(cls_batch.shape)
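The same loader plugs into a PointNet-style train.py; DATA_PATH, NUM_POINT, BATCH_SIZE, and FLAGS below come from that training script: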
TRAIN_DATASET = modelnet_dataset.ModelNetDataset(root=DATA_PATH, \
npoints=NUM_POINT, split='train', normal_channel=FLAGS.normal, batch_size=BATCH_SIZE)
TEST_DATASET = modelnet_dataset.ModelNetDataset(root=DATA_PATH, \
npoints=NUM_POINT, split='test', normal_channel=FLAGS.normal, batch_size=BATCH_SIZE)
def train_one_epoch(sess, ops, train_writer):
...
while TRAIN_DATASET.has_next_batch():
batch_data, batch_label = TRAIN_DATASET.next_batch(augment=True)
...
    TRAIN_DATASET.reset()
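As a bridge to the next section: the NumPy loader above can also be wrapped in tf.data via Dataset.from_generator. A minimal sketch, assuming TRAIN_DATASET and NUM_POINT from the snippet above:
import tensorflow as tf

def batch_gen():
    TRAIN_DATASET.reset()
    while TRAIN_DATASET.has_next_batch():
        yield TRAIN_DATASET.next_batch(augment=True)  # (points, labels)

dataset = tf.data.Dataset.from_generator(
    batch_gen,
    output_types=(tf.float32, tf.int32),
    output_shapes=([None, NUM_POINT, 3], [None]))  # last batch may be smaller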
2. Using the tf.data API
2.1 tf.data.Dataset
a. Creating a source
- tf.data.Dataset.from_tensors()
- tf.data.Dataset.from_tensor_slices((np_features, np_labels))
- Feeding arrays directly (limited to 2 GB)
dataset = tf.data.Dataset.from_tensor_slices((features, labels))
- Feeding through placeholders
features_placeholder = tf.placeholder(features.dtype, features.shape)
labels_placeholder = tf.placeholder(labels.dtype, labels.shape)
dataset = tf.data.Dataset.from_tensor_slices((features_placeholder, labels_placeholder))
## Usage:
iterator = dataset.make_initializable_iterator()
sess.run(iterator.initializer, feed_dict={features_placeholder: features,
labels_placeholder: labels})
- Feeding filenames, with preprocessing in map (see the shape note after the snippet)
import cv2  # OpenCV, needed by the Python-side decode function

def _read_py_function(filename, label):
    image_decoded = cv2.imread(filename.decode(), cv2.IMREAD_GRAYSCALE)
    return image_decoded, label
filenames = ["/var/data/image1.jpg", "/var/data/image2.jpg", ...]
labels = [0, 37, 29, 1, ...]
dataset = tf.data.Dataset.from_tensor_slices((filenames, labels))
dataset = dataset.map(
lambda filename, label: tuple(tf.py_func(
_read_py_function, [filename, label], [tf.uint8, label.dtype])))
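Note that tf.py_func drops static shape information, so a follow-up map that restores shapes is often needed; a sketch (the 28x28 image size is an assumption for illustration):
def _set_shape(image, label):
    image.set_shape([28, 28])  # py_func output has unknown shape; assumed size
    return image, label

dataset = dataset.map(_set_shape)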
- Batching
batched_dataset = dataset.batch(4)
# If batching raises a `Dimension(None)` / (?) shape error, see https://github.com/tensorflow/tensorflow/issues/18226
# batched_dataset = dataset.apply(tf.contrib.data.batch_and_drop_remainder(32))
# Check the resulting types and shapes
print(dataset.output_types)
print(dataset.output_shapes)
iterator = batched_dataset.make_one_shot_iterator()
next_element = iterator.get_next()
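Consuming the batches then looks like this in a TF 1.x session; a one-shot iterator signals exhaustion with tf.errors.OutOfRangeError:
with tf.Session() as sess:
    while True:
        try:
            batch = sess.run(next_element)  # one batch of up to 4 elements
        except tf.errors.OutOfRangeError:
            break  # dataset exhausted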
b. Applying a transformation: transforms a Dataset into a new Dataset (see the sketch after this list)
- Dataset.batch()
- Dataset.map()
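Transformations chain naturally; a minimal sketch (the buffer size, batch size, and preprocessing here are arbitrary choices for illustration):
dataset = tf.data.Dataset.from_tensor_slices((features, labels))
dataset = dataset.map(lambda x, y: (tf.cast(x, tf.float32) / 255.0, y))  # per-element preprocessing
dataset = dataset.shuffle(buffer_size=1000).repeat().batch(32)           # shuffle, repeat, batch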
2.2 tf.data.Iterator
The most common way to consume values from a Dataset is to create an iterator object.
- Dataset.make_one_shot_iterator()  # the only iterator type supported by Estimator
- Iterator.initializer  # useful when feeding data with feed_dict
sess.run(iterator.initializer, feed_dict={max_value: 10})
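In full context (a sketch of the TF 1.x initializable-iterator pattern; max_value is a placeholder that parameterizes the dataset):
max_value = tf.placeholder(tf.int64, shape=[])
dataset = tf.data.Dataset.range(max_value)
iterator = dataset.make_initializable_iterator()
next_element = iterator.get_next()

sess.run(iterator.initializer, feed_dict={max_value: 10})
for i in range(10):
    assert i == sess.run(next_element)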
- Iterator.get_next()
dataset = tf.data.Dataset.range(100)
iterator = dataset.make_one_shot_iterator()
next_element = iterator.get_next()
for i in range(100):
value = sess.run(next_element)
assert i == value