
Commit 89fc206

refactor dataloader
1 parent 63294dd commit 89fc206

8 files changed (+70, -152 lines)


README.md

Lines changed: 2 additions & 2 deletions
@@ -33,15 +33,15 @@ If you need run on NUSWIDE_81 and COCO, we recommend you to follow https://githu
 
 - [ ] Pretrain model of Alexnet
 - [ ] pretrained G model
-- [ ] resume training
 - [ ] eval frequence & eval at last iter
-- [ ] training longger
 - [ ] refactor all
 - [ ] use config instead of constant
 - [ ] use no split
 - [ ] evaluate mode
 - [ ] output dir which contains images, models, logs
 - [ ] mkdir automatically
+- [ ] training longger
+- [ ] resume training
 - [ ] rerun all process on a fresh machine
 
 Configuration for th models is specified in a list of constants at the top of
dataloader.py

Lines changed: 61 additions & 39 deletions

@@ -87,43 +87,65 @@ def get_labels(self):
         return np.asarray(self._label)
 
 
-def data_generator(batch_size, width_height, file_name):
-    _dataset = Dataset(file_name, True, width_height)
-
-    def get_epoch():
-
-        _index_in_epoch = 0
-        _perm = np.arange(_dataset.n_samples)
-        np.random.shuffle(_perm)
-        for _ in range(int(math.ceil(_dataset.n_samples / batch_size))):
-            start = _index_in_epoch
-            _index_in_epoch += batch_size
-            # finish one epoch
-            if _index_in_epoch > _dataset.n_samples:
-                data, label = _dataset.data(_perm[start:])
-                data1, label1 = _dataset.data(
-                    _perm[:_index_in_epoch - _dataset.n_samples])
-                data = np.concatenate([data, data1], axis=0)
-                label = np.concatenate([label, label1], axis=0)
-            else:
-                end = _index_in_epoch
-                data, label = _dataset.data(_perm[start:end])
-
-            # n*h*w*c -> n*c*h*w
-            data = np.transpose(data, (0, 3, 1, 2))
-            # bgr -> rgb
-            data = data[:, ::-1, :, :]
-            data = np.reshape(data, (batch_size, -1))
-            yield (data, label)
-
-    return get_epoch
-
-
-def load_train(batch_size, width_height, data_root):
-    return [data_generator(batch_size, width_height, os.path.join(data_root, split + '.txt'))
-            for split in ["train", "database_nolabel", "test"]]
-
-def load_val(batch_size, width_height, data_root):
-    return [data_generator(batch_size, width_height, os.path.join(data_root, split + '.txt'))
-            for split in ["database", "test.txt"]]
+class Dataloader(object):
+
+    def __init__(self, batch_size, width_height, data_root):
+        self.batch_size = batch_size
+        self.width_height = width_height
+        self.data_root = data_root
+
+    def data_generator(self, split):
+        file_name = os.path.join(self.data_root, split + '.txt')
+        _dataset = Dataset(file_name, True, self.width_height)
+
+        def get_epoch():
+
+            _index_in_epoch = 0
+            _perm = np.arange(_dataset.n_samples)
+            np.random.shuffle(_perm)
+            for _ in range(int(math.ceil(_dataset.n_samples / self.batch_size))):
+                start = _index_in_epoch
+                _index_in_epoch += self.batch_size
+                # finish one epoch
+                if _index_in_epoch > _dataset.n_samples:
+                    data, label = _dataset.data(_perm[start:])
+                    data1, label1 = _dataset.data(
+                        _perm[:_index_in_epoch - _dataset.n_samples])
+                    data = np.concatenate([data, data1], axis=0)
+                    label = np.concatenate([label, label1], axis=0)
+                else:
+                    end = _index_in_epoch
+                    data, label = _dataset.data(_perm[start:end])
+
+                # n*h*w*c -> n*c*h*w
+                data = np.transpose(data, (0, 3, 1, 2))
+                # bgr -> rgb
+                data = data[:, ::-1, :, :]
+                data = np.reshape(data, (self.batch_size, -1))
+                yield (data, label)
+
+        return get_epoch
 
+    @property
+    def train_gen(self):
+        return self.data_generator('train')
+
+    @property
+    def test_gen(self):
+        return self.data_generator('test')
+
+    @property
+    def db_gen(self):
+        return self.data_generator('database')
+
+    @property
+    def unlabeled_db_gen(self):
+        return self.data_generator('database_nolabel')
+
+    @staticmethod
+    def inf_gen(gen):
+        def generator():
+            while True:
+                for images_iter_, labels_iter_ in gen():
+                    return images_iter_, labels_iter_
+        return generator
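
For reference, a minimal usage sketch of the refactored Dataloader. The constructor values below are illustrative, not taken from this repo's config, and it assumes a data_root directory containing the train.txt, test.txt, database.txt, and database_nolabel.txt split files:

from dataloader import Dataloader

loader = Dataloader(batch_size=4, width_height=32, data_root='./data/cifar10')

get_epoch = loader.train_gen          # property returns a fresh epoch factory
for images, labels in get_epoch():    # one shuffled pass over train.txt
    # For 3-channel input, images is (4, 3*32*32): batches are converted
    # NHWC -> NCHW, flipped BGR -> RGB, then flattened to (batch_size, -1).
    # Under Python 3 division, 10 samples give ceil(10/4) = 3 batches; the
    # last batch wraps around and reuses 2 samples from the epoch's start.
    print(images.shape, labels.shape)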

dataloader/__init__.py

Lines changed: 0 additions & 1 deletion
This file was deleted.

dataloader/cifar10.py

Lines changed: 0 additions & 30 deletions
This file was deleted.

dataloader/coco.py

Lines changed: 0 additions & 31 deletions
This file was deleted.

dataloader/nuswide81.py

Lines changed: 0 additions & 32 deletions
This file was deleted.

main.py

Lines changed: 7 additions & 9 deletions
@@ -20,7 +20,7 @@
 import tensorflow as tf
 from tensorflow.python.client import device_lib
 
-import dataloader
+from dataloader import Dataloader
 import tflib as lib
 import tflib.plot
 import tflib.save_images

@@ -33,9 +33,9 @@
 
 
 def main(cfg):
-    dataset = dataloader.__dict__[cfg.DATA.USE_DATASET]
     DEVICES = [x.name for x in device_lib.list_local_devices()
                if x.device_type == 'GPU']
+    dataloader = Dataloader(cfg.DATA.BATCH_SIZE, cfg.DATA.WIDTH_HEIGHT, cfg.DATA.DATA_ROOT)
 
     configProto = tf.ConfigProto()
     configProto.gpu_options.allow_growth = True

@@ -309,9 +309,8 @@ def generate_image(frame):
         lib.save_images.save_images(samples.reshape((100, 3, cfg.DATA.WIDTH_HEIGHT, cfg.DATA.WIDTH_HEIGHT)),
                                     '{}/samples_{}.png'.format(cfg.DATA.IMAGE_DIR, frame))
 
-    train_gen, unlabel_train_gen, dev_gen = dataset.load(cfg.TRAIN.BATCH_SIZE, cfg.DATA.WIDTH_HEIGHT)
-    gen = util.inf_gen(train_gen)
-    unlabel_gen = util.inf_gen(unlabel_train_gen)
+    gen = dataloader.inf_gen(dataloader.train_gen)
+    unlabel_gen = dataloader.inf_gen(dataloader.unlabeled_db_gen)
 
     util.print_param_size(gen_gv, disc_gv)
 

@@ -378,19 +377,18 @@ def generate_image(frame):
 
         # calculate mAP score w.r.t all db data every 10000 config.TRAIN.ITERS
         if (iteration + 1) % 10000 == 0:
-            _db_gen, _test_gen = dataset.load_val(cfg.TRAIN.BATCH_SIZE, cfg.DATA.WIDTH_HEIGHT)
             db_output = []
             db_labels = []
             test_output = []
             test_labels = []
-            for images, _labels in _test_gen():
-                _disc_acgan_output, __cost = session.run([disc_real_acgan, disc_real_acgan_cost],
+            for images, _labels in dataloader.test_gen():
+                _disc_acgan_output, _ = session.run([disc_real_acgan, disc_real_acgan_cost],
                                                          feed_dict={all_real_data_int: images,
                                                                     all_real_labels: _labels})
                 test_output.append(_disc_acgan_output)
                 test_labels.append(_labels)
 
-            for images, _labels in _db_gen():
+            for images, _labels in dataloader.db_gen():
                 _disc_acgan_output, _ = session.run([disc_real_acgan, disc_real_acgan_cost],
                                                     feed_dict={all_real_data_int: images, all_real_labels: _labels})
                 db_output.append(_disc_acgan_output)
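
Pulling the hunks above together, a hedged sketch of the new wiring in main(). Only the cfg field names and Dataloader calls come from this diff; the loop bodies are placeholders:

from dataloader import Dataloader

def main(cfg):
    dataloader = Dataloader(cfg.DATA.BATCH_SIZE, cfg.DATA.WIDTH_HEIGHT, cfg.DATA.DATA_ROOT)

    # Training draws batches through the inf_gen wrapper...
    gen = dataloader.inf_gen(dataloader.train_gen)
    unlabel_gen = dataloader.inf_gen(dataloader.unlabeled_db_gen)

    # ...while the periodic mAP evaluation drains whole epochs straight from
    # the split generators, replacing the old dataset.load_val() call.
    for images, _labels in dataloader.test_gen():
        pass  # session.run(...) on each test batch
    for images, _labels in dataloader.db_gen():
        pass  # session.run(...) on each database batch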

util.py

Lines changed: 0 additions & 8 deletions
@@ -8,14 +8,6 @@
 import locale
 
 
-def inf_gen(gen):
-    def generator():
-        while True:
-            for images_iter_, labels_iter_ in gen():
-                return images_iter_, labels_iter_
-    return generator
-
-
 # compute param size
 def print_param_size(gen_gv, disc_gv):
     print("computing param size")
