Fix tests and make num_gpus a required argument of the ResNet input functions

guptapriya · guptapriya · commit 31649444e22e · 2018-05-05T15:09:51.000-07:00
diff --git a/official/resnet/cifar10_main.py b/official/resnet/cifar10_main.py
@@ -106,16 +106,16 @@ def preprocess_image(image, is_training):
   return image
 
 
-def input_fn(is_training, data_dir, global_batch_size, num_epochs=1,
-             num_gpus=1, datasets_num_private_threads=None):
+def input_fn(is_training, data_dir, global_batch_size,
+             num_gpus, num_epochs=1, datasets_num_private_threads=None):
   """Input_fn using the tf.data input pipeline for CIFAR-10 dataset.
 
   Args:
     is_training: A boolean denoting whether the input is for training.
     data_dir: The directory containing the input data.
     global_batch_size: The number of samples per batch.
-    num_epochs: The number of epochs to repeat the dataset.
     num_gpus: The number of GPUs.
+    num_epochs: The number of epochs to repeat the dataset.
     datasets_num_private_threads: Number of threads for a private
       threadpool created for all datasets computation.
 
@@ -128,7 +128,7 @@ def input_fn(is_training, data_dir, global_batch_size, num_epochs=1,
 
   return resnet_run_loop.process_record_dataset(
       dataset, is_training, global_batch_size, _NUM_IMAGES['train'],
-      parse_record, num_epochs, num_gpus, datasets_num_private_threads
+      parse_record, num_gpus, num_epochs, datasets_num_private_threads
   )
 
 
diff --git a/official/resnet/cifar10_test.py b/official/resnet/cifar10_test.py
@@ -64,21 +64,21 @@ def test_dataset_input_fn(self):
         lambda val: cifar10_main.parse_record(val, False))
     image, label = fake_dataset.make_one_shot_iterator().get_next()
 
-    self.assertAllEqual(label.shape, (10,))
+    self.assertAllEqual(label.shape, ())
     self.assertAllEqual(image.shape, (_HEIGHT, _WIDTH, _NUM_CHANNELS))
 
     with self.test_session() as sess:
       image, label = sess.run([image, label])
 
-      self.assertAllEqual(label, np.array([int(i == 7) for i in range(10)]))
+      self.assertEqual(label, 7)
 
       for row in image:
         for pixel in row:
           self.assertAllClose(pixel, np.array([-1.225, 0., 1.225]), rtol=1e-3)
 
   def cifar10_model_fn_helper(self, mode, resnet_version, dtype):
     input_fn = cifar10_main.get_synth_input_fn()
-    dataset = input_fn(True, '', _BATCH_SIZE)
+    dataset = input_fn(True, '', _BATCH_SIZE, 1)
     iterator = dataset.make_one_shot_iterator()
     features, labels = iterator.get_next()
     spec = cifar10_main.cifar10_model_fn(
diff --git a/official/resnet/imagenet_main.py b/official/resnet/imagenet_main.py
@@ -155,16 +155,16 @@ def parse_record(raw_record, is_training):
   return image, label
 
 
-def input_fn(is_training, data_dir, global_batch_size, num_epochs=1,
-             num_gpus=1, datasets_num_private_threads=None):
+def input_fn(is_training, data_dir, global_batch_size,
+             num_gpus, num_epochs=1, datasets_num_private_threads=None):
   """Input function which provides batches for train or eval.
 
   Args:
     is_training: A boolean denoting whether the input is for training.
     data_dir: The directory containing the input data.
     global_batch_size: The number of samples per batch.
-    num_epochs: The number of epochs to repeat the dataset.
     num_gpus: The number of GPUs.
+    num_epochs: The number of epochs to repeat the dataset.
     datasets_num_private_threads: Number of threads for a private
       threadpool created for all datasets computation.
 
@@ -184,7 +184,7 @@ def input_fn(is_training, data_dir, global_batch_size, num_epochs=1,
 
   return resnet_run_loop.process_record_dataset(
       dataset, is_training, global_batch_size, _SHUFFLE_BUFFER, parse_record,
-      num_epochs, num_gpus, datasets_num_private_threads
+      num_gpus, num_epochs, datasets_num_private_threads
   )
 
 
diff --git a/official/resnet/imagenet_test.py b/official/resnet/imagenet_test.py
@@ -192,7 +192,7 @@ def resnet_model_fn_helper(self, mode, resnet_version, dtype):
     tf.train.create_global_step()
 
     input_fn = imagenet_main.get_synth_input_fn()
-    dataset = input_fn(True, '', _BATCH_SIZE)
+    dataset = input_fn(True, '', _BATCH_SIZE, 1)
     iterator = dataset.make_one_shot_iterator()
     features, labels = iterator.get_next()
     spec = imagenet_main.imagenet_model_fn(
diff --git a/official/resnet/resnet_run_loop.py b/official/resnet/resnet_run_loop.py
@@ -40,8 +40,8 @@
 # Functions for input processing.
 ################################################################################
 def process_record_dataset(dataset, is_training, global_batch_size,
-                           shuffle_buffer, parse_record_fn, num_epochs=1,
-                           num_gpus=1, datasets_num_private_threads=None):
+                           shuffle_buffer, parse_record_fn, num_gpus,
+                           num_epochs=1, datasets_num_private_threads=None):
   """Given a Dataset with raw records, return an iterator over the records.
 
   Args:
@@ -53,8 +53,8 @@ def process_record_dataset(dataset, is_training, global_batch_size,
       time and use less memory.
     parse_record_fn: A function that takes a raw record and returns the
       corresponding (image, label) pair.
-    num_epochs: The number of epochs to repeat the dataset.
     num_gpus: The number of GPUs.
+    num_epochs: The number of epochs to repeat the dataset.
     datasets_num_private_threads: Number of threads for a private 
       threadpool created for all datasets computation.
 
@@ -121,7 +121,9 @@ def get_synth_input_fn(height, width, num_channels, num_classes):
     An input_fn that can be used in place of a real one to return a dataset
     that can be used for iteration.
   """
-  def input_fn(is_training, data_dir, batch_size, *args, **kwargs):  # pylint: disable=unused-argument
+  def input_fn(is_training, data_dir, global_batch_size, num_gpus, 
+               *args, **kwargs):  # pylint: disable=unused-argument
+    batch_size=per_device_batch_size(global_batch_size, num_gpus)
     images = tf.zeros((batch_size, height, width, num_channels), tf.float32)
     labels = tf.zeros((batch_size), tf.int32)
     return tf.data.Dataset.from_tensors((images, labels)).repeat()
@@ -366,7 +368,7 @@ def resnet_main(
   # Using the Winograd non-fused algorithms provides a small performance boost.
   os.environ['TF_ENABLE_WINOGRAD_NONFUSED'] = '1'
   os.environ['TF_GPU_THREAD_MODE'] = flags_obj.tf_gpu_thread_mode
-  os.environ['TF_GPU_THREAD_COUNT'] = flags_obj.tf_gpu_thread_count
+  os.environ['TF_GPU_THREAD_COUNT'] = str(flags_obj.tf_gpu_thread_count)
 
 
   # Create session config based on values of inter_op_parallelism_threads and
@@ -378,13 +380,15 @@ def resnet_main(
       intra_op_parallelism_threads=flags_obj.intra_op_parallelism_threads,
       allow_soft_placement=True)
 
-  if flags_core.get_num_gpus(flags_obj) == 0:
+  num_gpus = flags_core.get_num_gpus(flags_obj)
+
+  if num_gpus == 0:
     distribution = tf.contrib.distribute.OneDeviceStrategy('device:CPU:0')
-  elif flags_core.get_num_gpus(flags_obj) == 1:
+  elif num_gpus == 1:
     distribution = tf.contrib.distribute.OneDeviceStrategy('device:GPU:0')
   else:
     distribution = tf.contrib.distribute.MirroredStrategy(
-        num_gpus=flags_core.get_num_gpus(flags_obj)
+        num_gpus=num_gpus
     )
 
   run_config = tf.estimator.RunConfig(train_distribute=distribution,
@@ -419,17 +423,21 @@ def resnet_main(
 
   def input_fn_train():
     return input_function(
-        is_training=True, data_dir=flags_obj.data_dir,
+        is_training=True,
+        data_dir=flags_obj.data_dir,
         global_batch_size=flags_obj.batch_size, 
+        num_gpus=num_gpus,
         num_epochs=flags_obj.epochs_between_evals,
-        num_gpus=flags_core.get_num_gpus(flags_obj))
+        datasets_num_private_threads=flags_obj.datasets_num_private_threads)
 
   def input_fn_eval():
     return input_function(
-        is_training=False, data_dir=flags_obj.data_dir,
+        is_training=False,
+        data_dir=flags_obj.data_dir,
         global_batch_size=flags_obj.batch_size,
+        num_gpus=num_gpus,
         num_epochs=1,
-        num_gpus=flags_core.get_num_gpus(flags_obj))
+        datasets_num_private_threads=flags_obj.datasets_num_private_threads)
 
 
   total_training_cycle = (flags_obj.train_epochs //
diff --git a/official/utils/flags/_performance.py b/official/utils/flags/_performance.py
@@ -135,7 +135,7 @@ def _check_loss_scale(loss_scale):  # pylint: disable=unused-variable
     flags.DEFINE_string(
         name="tf_gpu_thread_mode", short_name="gt_mode", default="global",
         help=help_wrap(
-             "Whether and how the GPU device uses its own threadpool.")
+            "Whether and how the GPU device uses its own threadpool.")
     )
 
   if tf_gpu_thread_count:
@@ -149,8 +149,8 @@ def _check_loss_scale(loss_scale):  # pylint: disable=unused-variable
         name="datasets_num_private_threads", short_name="dataset_thread_count",
         default=None,
         help=help_wrap(
-             "Number of threads for a private threadpool created for all"
-             "datasets computation..")
+            "Number of threads for a private threadpool created for all"
+            "datasets computation..")
     )
 
   return key_flags