
Commit c494582

Taylor Robie authored and reedwm committed
Move evaluation to .evaluate() (tensorflow#5413)

* move evaluation from numpy to tensorflow
* fix syntax error
* don't use sigmoid to convert logits. there is too much precision loss.
* WIP: add logit metrics
* continue refactor of NCF evaluation
* fix syntax error
* fix bugs in eval loss calculation
* fix eval loss reweighting
* remove numpy based metric calculations
* fix logging hooks
* fix sigmoid to softmax bug
* fix comment
* catch rare PIPE error and address some PR comments
* fix metric test and address PR comments
* delint and fix python2
* fix test and address PR comments
* extend eval to TPUs
1 parent f3be93a · commit c494582

9 files changed, +363 −238 lines
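
The commit message's claim that converting logits with a sigmoid loses too much precision is easy to demonstrate in isolation: in float32 the sigmoid saturates to exactly 1.0 for moderately large logits, so ranking on probabilities collapses ties that the raw logits would still resolve. A minimal standalone illustration (not code from this commit):

import numpy as np

# Three items whose raw logits clearly order them...
logits = np.array([18.0, 25.0, 40.0], dtype=np.float32)

# ...but whose float32 sigmoid outputs are all exactly 1.0, because
# 1 / (1 + exp(-18)) differs from 1.0 by less than float32 epsilon.
probs = 1.0 / (1.0 + np.exp(-logits))

print(probs)                 # [1. 1. 1.] -- indistinguishable after saturation
print(np.argsort(-logits))   # [2 1 0]    -- raw logits still rank correctly
assert probs[0] == probs[2]  # top-k over probs cannot break this tie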

official/recommendation/constants.py (+6)
@@ -52,6 +52,12 @@ def __init__(self, data_dir, cache_id=None):
 # when performing evaluation.
 NUM_EVAL_NEGATIVES = 999
 
+# keys for evaluation metrics
+TOP_K = 10  # Top-k list for evaluation
+HR_KEY = "HR"
+NDCG_KEY = "NDCG"
+DUPLICATE_MASK = "duplicate_mask"
+
 # ==============================================================================
 # == Subprocess Data Generation ================================================
 # ==============================================================================
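
The new keys name the hit rate (HR@10) and normalized discounted cumulative gain (NDCG@10) metrics that evaluation now computes inside .evaluate(). As a rough sketch of what those metrics mean, here is a NumPy illustration, not the commit's TensorFlow implementation; it assumes the true item sits in column 0 of each user's row of 1 + NUM_EVAL_NEGATIVES candidates:

import numpy as np

NUM_EVAL_NEGATIVES = 999
TOP_K = 10

def hr_and_ndcg(logits, dupe_mask, top_k=TOP_K):
  """logits, dupe_mask: arrays of shape (num_users, 1 + NUM_EVAL_NEGATIVES)."""
  # Push duplicated negatives below every real candidate so they cannot
  # spuriously outrank the true item.
  logits = np.where(dupe_mask.astype(bool), -np.inf, logits)
  # Rank of the true item (column 0) = number of negatives scored above it.
  rank = np.sum(logits[:, 1:] > logits[:, :1], axis=1)
  in_top_k = rank < top_k
  hr = in_top_k.mean()                                                # HR@K
  ndcg = np.where(in_top_k, np.log(2) / np.log(rank + 2), 0.0).mean() # NDCG@K
  return hr, ndcg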

official/recommendation/data_async_generation.py (+17 −3)
@@ -124,7 +124,7 @@ def _process_shard(args):
   return users_out, items_out, labels_out
 
 
-def _construct_record(users, items, labels=None):
+def _construct_record(users, items, labels=None, dupe_mask=None):
   """Convert NumPy arrays into a TFRecords entry."""
   feature_dict = {
       movielens.USER_COLUMN: tf.train.Feature(
@@ -136,6 +136,10 @@ def _construct_record(users, items, labels=None):
     feature_dict["labels"] = tf.train.Feature(
         bytes_list=tf.train.BytesList(value=[memoryview(labels).tobytes()]))
 
+  if dupe_mask is not None:
+    feature_dict[rconst.DUPLICATE_MASK] = tf.train.Feature(
+        bytes_list=tf.train.BytesList(value=[memoryview(dupe_mask).tobytes()]))
+
   return tf.train.Example(
       features=tf.train.Features(feature=feature_dict)).SerializeToString()
 
@@ -305,6 +309,9 @@ def _construct_training_records(
 def _construct_eval_record(cache_paths, eval_batch_size):
   """Convert Eval data to a single TFRecords file."""
 
+  # Later logic assumes that all items for a given user are in the same batch.
+  assert not eval_batch_size % (rconst.NUM_EVAL_NEGATIVES + 1)
+
   log_msg("Beginning construction of eval TFRecords file.")
   raw_fpath = cache_paths.eval_raw_file
   intermediate_fpath = cache_paths.eval_record_template_temp
@@ -332,9 +339,16 @@ def _construct_eval_record(cache_paths, eval_batch_size):
   num_batches = users.shape[0]
   with tf.python_io.TFRecordWriter(intermediate_fpath) as writer:
     for i in range(num_batches):
+      batch_users = users[i, :]
+      batch_items = items[i, :]
+      dupe_mask = stat_utils.mask_duplicates(
+          batch_items.reshape(-1, rconst.NUM_EVAL_NEGATIVES + 1),
+          axis=1).flatten().astype(np.int8)
+
       batch_bytes = _construct_record(
-          users=users[i, :],
-          items=items[i, :]
+          users=batch_users,
+          items=batch_items,
+          dupe_mask=dupe_mask
       )
       writer.write(batch_bytes)
   tf.gfile.Rename(intermediate_fpath, dest_fpath)
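
stat_utils.mask_duplicates itself is not shown in this diff; from how it is called here, it returns an array of the input's shape marking values that repeat along an axis. A plausible stand-in for reference (hypothetical, row-wise case only; the real helper may be vectorized differently):

import numpy as np

def mask_duplicates(x, axis=1):
  """Mark entries that repeat an earlier value in their row with 1."""
  assert axis == 1  # this sketch only handles the row-wise case used above
  out = np.zeros_like(x, dtype=np.int8)
  for i, row in enumerate(x):
    seen = set()
    for j, val in enumerate(row):
      if val in seen:
        out[i, j] = 1
      seen.add(val)
  return out

# Each eval batch is reshaped to (users, 1 + NUM_EVAL_NEGATIVES), so the mask
# flags negatives that collide with another candidate for the same user:
items = np.array([[7, 3, 7, 5], [2, 2, 2, 9]])
print(mask_duplicates(items, axis=1))  # [[0 0 1 0], [0 1 1 0]]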

official/recommendation/data_preprocessing.py (+15 −4)
@@ -27,6 +27,7 @@
 import os
 import pickle
 import signal
+import socket
 import subprocess
 import time
 import timeit
@@ -399,10 +400,14 @@ def _shutdown(proc):
   """Convenience function to cleanly shut down async generation process."""
 
   tf.logging.info("Shutting down train data creation subprocess.")
-  proc.send_signal(signal.SIGINT)
-  time.sleep(1)
-  if proc.returncode is not None:
-    return  # SIGINT was handled successfully within 1 sec
+  try:
+    proc.send_signal(signal.SIGINT)
+    time.sleep(1)
+    if proc.returncode is not None:
+      return  # SIGINT was handled successfully within 1 sec
+
+  except socket.error:
+    pass
 
   # Otherwise another second of grace period and then forcibly kill the process.
   time.sleep(1)
@@ -493,6 +498,8 @@ def make_deserialize(params, batch_size, training=False):
   }
   if training:
     feature_map["labels"] = tf.FixedLenFeature([], dtype=tf.string)
+  else:
+    feature_map[rconst.DUPLICATE_MASK] = tf.FixedLenFeature([], dtype=tf.string)
 
   def deserialize(examples_serialized):
     """Called by Dataset.map() to convert batches of records to tensors."""
@@ -506,13 +513,17 @@
     items = tf.cast(items, tf.int32)  # TPU doesn't allow uint16 infeed.
 
     if not training:
+      dupe_mask = tf.reshape(tf.cast(tf.decode_raw(
+          features[rconst.DUPLICATE_MASK], tf.int8), tf.bool), (batch_size,))
       return {
           movielens.USER_COLUMN: users,
          movielens.ITEM_COLUMN: items,
+          rconst.DUPLICATE_MASK: dupe_mask,
       }
 
     labels = tf.reshape(tf.cast(tf.decode_raw(
         features["labels"], tf.int8), tf.bool), (batch_size,))
+
     return {
         movielens.USER_COLUMN: users,
         movielens.ITEM_COLUMN: items,
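
The duplicate mask travels as raw int8 bytes: _construct_record stores memoryview(dupe_mask).tobytes(), and deserialize recovers it with tf.decode_raw followed by a cast to bool. The round trip, mirrored in plain NumPy to show the byte layout (illustrative only):

import numpy as np

mask = np.array([0, 1, 0, 0, 1], dtype=np.int8)
raw = memoryview(mask).tobytes()             # what _construct_record serializes
decoded = np.frombuffer(raw, dtype=np.int8)  # what tf.decode_raw recovers

assert (decoded == mask).all()
assert decoded.astype(bool).tolist() == [False, True, False, False, True]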

official/recommendation/data_test.py (+3 −2)
@@ -36,6 +36,7 @@
 NUM_ITEMS = 2000
 NUM_PTS = 50000
 BATCH_SIZE = 2048
+EVAL_BATCH_SIZE = 4000
 NUM_NEG = 4
 
 
@@ -112,8 +113,8 @@ def drain_dataset(self, dataset, g):
   def test_end_to_end(self):
     ncf_dataset, _ = data_preprocessing.instantiate_pipeline(
         dataset=DATASET, data_dir=self.temp_data_dir,
-        batch_size=BATCH_SIZE, eval_batch_size=BATCH_SIZE, num_data_readers=2,
-        num_neg=NUM_NEG)
+        batch_size=BATCH_SIZE, eval_batch_size=EVAL_BATCH_SIZE,
+        num_data_readers=2, num_neg=NUM_NEG)
 
     g = tf.Graph()
     with g.as_default():
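
The test switches to a dedicated EVAL_BATCH_SIZE because of the new assertion in _construct_eval_record: the eval batch size must be a multiple of NUM_EVAL_NEGATIVES + 1 = 1000 so that each user's candidates land in a single batch. The old value would now fail:

NUM_EVAL_NEGATIVES = 999

assert not 4000 % (NUM_EVAL_NEGATIVES + 1)  # EVAL_BATCH_SIZE = 4000 passes
assert 2048 % (NUM_EVAL_NEGATIVES + 1)      # BATCH_SIZE = 2048 would trip it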
