Showing 1 changed file with 366 additions and 340 deletions
@@ -34,366 +34,392 @@ from tensorflow import logging
34 | from tensorflow.python.lib.io import file_io | 34 | from tensorflow.python.lib.io import file_io |
35 | import utils | 35 | import utils |
36 | from collections import Counter | 36 | from collections import Counter |
37 | +import operator | ||
37 | 38 | ||
38 | FLAGS = flags.FLAGS | 39 | FLAGS = flags.FLAGS |
39 | 40 | ||
40 | if __name__ == "__main__": | 41 | if __name__ == "__main__": |
41 | - # Input | 42 | + # Input |
42 | - flags.DEFINE_string( | 43 | + flags.DEFINE_string( |
43 | - "train_dir", "", "The directory to load the model files from. We assume " | 44 | + "train_dir", "", "The directory to load the model files from. We assume " |
44 | - "that you have already run eval.py onto this, such that " | 45 | + "that you have already run eval.py onto this, such that " |
45 | - "inference_model.* files already exist.") | 46 | + "inference_model.* files already exist.") |
46 | - flags.DEFINE_string( | 47 | + flags.DEFINE_string( |
47 | - "input_data_pattern", "", | 48 | + "input_data_pattern", "", |
48 | - "File glob defining the evaluation dataset in tensorflow.SequenceExample " | 49 | + "File glob defining the evaluation dataset in tensorflow.SequenceExample " |
49 | - "format. The SequenceExamples are expected to have an 'rgb' byte array " | 50 | + "format. The SequenceExamples are expected to have an 'rgb' byte array " |
50 | - "sequence feature as well as a 'labels' int64 context feature.") | 51 | + "sequence feature as well as a 'labels' int64 context feature.") |
51 | - flags.DEFINE_string( | 52 | + flags.DEFINE_string( |
52 | - "input_model_tgz", "", | 53 | + "input_model_tgz", "", |
53 | - "If given, must be path to a .tgz file that was written " | 54 | + "If given, must be path to a .tgz file that was written " |
54 | - "by this binary using flag --output_model_tgz. In this " | 55 | + "by this binary using flag --output_model_tgz. In this " |
55 | - "case, the .tgz file will be untarred to " | 56 | + "case, the .tgz file will be untarred to " |
56 | - "--untar_model_dir and the model will be used for " | 57 | + "--untar_model_dir and the model will be used for " |
57 | - "inference.") | 58 | + "inference.") |
58 | - flags.DEFINE_string( | 59 | + flags.DEFINE_string( |
59 | - "untar_model_dir", "/tmp/yt8m-model", | 60 | + "untar_model_dir", "/tmp/yt8m-model", |
60 | - "If --input_model_tgz is given, then this directory will " | 61 | + "If --input_model_tgz is given, then this directory will " |
61 | - "be created and the contents of the .tgz file will be " | 62 | + "be created and the contents of the .tgz file will be " |
62 | - "untarred here.") | 63 | + "untarred here.") |
63 | - flags.DEFINE_bool( | 64 | + flags.DEFINE_bool( |
64 | - "segment_labels", False, | 65 | + "segment_labels", False, |
65 | - "If set, then --input_data_pattern must be frame-level features (but with" | 66 | + "If set, then --input_data_pattern must be frame-level features (but with" |
66 | - " segment_labels). Otherwise, --input_data_pattern must be aggregated " | 67 | + " segment_labels). Otherwise, --input_data_pattern must be aggregated " |
67 | - "video-level features. The model must also be set appropriately (i.e. to " | 68 | + "video-level features. The model must also be set appropriately (i.e. to " |
68 | - "read 3D batches VS 4D batches.") | 69 | + "read 3D batches VS 4D batches.") |
69 | - flags.DEFINE_integer("segment_max_pred", 100000, | 70 | + flags.DEFINE_integer("segment_max_pred", 100000, |
70 | - "Limit total number of segment outputs per entity.") | 71 | + "Limit total number of segment outputs per entity.") |
71 | - flags.DEFINE_string( | 72 | + flags.DEFINE_string( |
72 | - "segment_label_ids_file", | 73 | + "segment_label_ids_file", |
73 | - "https://raw.githubusercontent.com/google/youtube-8m/master/segment_label_ids.csv", | 74 | + "https://raw.githubusercontent.com/google/youtube-8m/master/segment_label_ids.csv", |
74 | - "The file that contains the segment label ids.") | 75 | + "The file that contains the segment label ids.") |
75 | - | 76 | + |
76 | - # Output | 77 | + # Output |
77 | - flags.DEFINE_string("output_file", "", "The file to save the predictions to.") | 78 | + flags.DEFINE_string("output_file", "", "The file to save the predictions to.") |
78 | - flags.DEFINE_string( | 79 | + flags.DEFINE_string( |
79 | - "output_model_tgz", "", | 80 | + "output_model_tgz", "", |
80 | - "If given, should be a filename with a .tgz extension, " | 81 | + "If given, should be a filename with a .tgz extension, " |
81 | - "the model graph and checkpoint will be bundled in this " | 82 | + "the model graph and checkpoint will be bundled in this " |
82 | - "gzip tar. This file can be uploaded to Kaggle for the " | 83 | + "gzip tar. This file can be uploaded to Kaggle for the " |
83 | - "top 10 participants.") | 84 | + "top 10 participants.") |
84 | - flags.DEFINE_integer("top_k", 1, "How many predictions to output per video.") | 85 | + flags.DEFINE_integer("top_k", 5, "How many predictions to output per video.") |
85 | - | 86 | + |
86 | - # Other flags. | 87 | + # Other flags. |
87 | - flags.DEFINE_integer("batch_size", 512, | 88 | + flags.DEFINE_integer("batch_size", 512, |
88 | - "How many examples to process per batch.") | 89 | + "How many examples to process per batch.") |
89 | - flags.DEFINE_integer("num_readers", 1, | 90 | + flags.DEFINE_integer("num_readers", 1, |
90 | - "How many threads to use for reading input files.") | 91 | + "How many threads to use for reading input files.") |
91 | 92 | ||
92 | 93 | ||
93 | def format_lines(video_ids, predictions, top_k, whitelisted_cls_mask=None): | 94 | def format_lines(video_ids, predictions, top_k, whitelisted_cls_mask=None): |
94 | - """Create an information line the submission file.""" | 95 | + """Create an information line the submission file.""" |
95 | - batch_size = len(video_ids) | 96 | + batch_size = len(video_ids) |
96 | - for video_index in range(batch_size): | 97 | + for video_index in range(batch_size): |
97 | - video_prediction = predictions[video_index] | 98 | + video_prediction = predictions[video_index] |
98 | - if whitelisted_cls_mask is not None: | 99 | + if whitelisted_cls_mask is not None: |
99 | - # Whitelist classes. | 100 | + # Whitelist classes. |
100 | - video_prediction *= whitelisted_cls_mask | 101 | + video_prediction *= whitelisted_cls_mask |
101 | - top_indices = np.argpartition(video_prediction, -top_k)[-top_k:] | 102 | + top_indices = np.argpartition(video_prediction, -top_k)[-top_k:] |
102 | - line = [(class_index, predictions[video_index][class_index]) | 103 | + line = [(class_index, predictions[video_index][class_index]) |
103 | - for class_index in top_indices] | 104 | + for class_index in top_indices] |
104 | - line = sorted(line, key=lambda p: -p[1]) | 105 | + line = sorted(line, key=lambda p: -p[1]) |
105 | - yield (video_ids[video_index] + "," + | 106 | + yield (video_ids[video_index] + "," + |
106 | - " ".join("%i %g" % (label, score) for (label, score) in line) + | 107 | + " ".join("%i %g" % (label, score) for (label, score) in line) + |
107 | - "\n").encode("utf8") | 108 | + "\n").encode("utf8") |
108 | 109 | ||
109 | 110 | ||
110 | def get_input_data_tensors(reader, data_pattern, batch_size, num_readers=1): | 111 | def get_input_data_tensors(reader, data_pattern, batch_size, num_readers=1): |
111 | - """Creates the section of the graph which reads the input data. | 112 | + """Creates the section of the graph which reads the input data. |
112 | - | 113 | + |
113 | - Args: | 114 | + Args: |
114 | - reader: A class which parses the input data. | 115 | + reader: A class which parses the input data. |
115 | - data_pattern: A 'glob' style path to the data files. | 116 | + data_pattern: A 'glob' style path to the data files. |
116 | - batch_size: How many examples to process at a time. | 117 | + batch_size: How many examples to process at a time. |
117 | - num_readers: How many I/O threads to use. | 118 | + num_readers: How many I/O threads to use. |
118 | - | 119 | + |
119 | - Returns: | 120 | + Returns: |
120 | - A tuple containing the features tensor, labels tensor, and optionally a | 121 | + A tuple containing the features tensor, labels tensor, and optionally a |
121 | - tensor containing the number of frames per video. The exact dimensions | 122 | + tensor containing the number of frames per video. The exact dimensions |
122 | - depend on the reader being used. | 123 | + depend on the reader being used. |
123 | - | 124 | + |
124 | - Raises: | 125 | + Raises: |
125 | - IOError: If no files matching the given pattern were found. | 126 | + IOError: If no files matching the given pattern were found. |
126 | - """ | 127 | + """ |
127 | - with tf.name_scope("input"): | 128 | + with tf.name_scope("input"): |
128 | - files = gfile.Glob(data_pattern) | 129 | + files = gfile.Glob(data_pattern) |
129 | - if not files: | 130 | + if not files: |
130 | - raise IOError("Unable to find input files. data_pattern='" + | 131 | + raise IOError("Unable to find input files. data_pattern='" + |
131 | - data_pattern + "'") | 132 | + data_pattern + "'") |
132 | - logging.info("number of input files: " + str(len(files))) | 133 | + logging.info("number of input files: " + str(len(files))) |
133 | - filename_queue = tf.train.string_input_producer(files, | 134 | + filename_queue = tf.train.string_input_producer(files, |
134 | - num_epochs=1, | 135 | + num_epochs=1, |
135 | - shuffle=False) | 136 | + shuffle=False) |
136 | - examples_and_labels = [ | 137 | + examples_and_labels = [ |
137 | - reader.prepare_reader(filename_queue) for _ in range(num_readers) | 138 | + reader.prepare_reader(filename_queue) for _ in range(num_readers) |
138 | - ] | 139 | + ] |
139 | - | 140 | + |
140 | - input_data_dict = (tf.train.batch_join(examples_and_labels, | 141 | + input_data_dict = (tf.train.batch_join(examples_and_labels, |
141 | - batch_size=batch_size, | 142 | + batch_size=batch_size, |
142 | - allow_smaller_final_batch=True, | 143 | + allow_smaller_final_batch=True, |
143 | - enqueue_many=True)) | 144 | + enqueue_many=True)) |
144 | - video_id_batch = input_data_dict["video_ids"] | 145 | + video_id_batch = input_data_dict["video_ids"] |
145 | - video_batch = input_data_dict["video_matrix"] | 146 | + video_batch = input_data_dict["video_matrix"] |
146 | - num_frames_batch = input_data_dict["num_frames"] | 147 | + num_frames_batch = input_data_dict["num_frames"] |
147 | - return video_id_batch, video_batch, num_frames_batch | 148 | + return video_id_batch, video_batch, num_frames_batch |
148 | 149 | ||
149 | 150 | ||
150 | def get_segments(batch_video_mtx, batch_num_frames, segment_size): | 151 | def get_segments(batch_video_mtx, batch_num_frames, segment_size): |
151 | - """Get segment-level inputs from frame-level features.""" | 152 | + """Get segment-level inputs from frame-level features.""" |
152 | - video_batch_size = batch_video_mtx.shape[0] | 153 | + video_batch_size = batch_video_mtx.shape[0] |
153 | - max_frame = batch_video_mtx.shape[1] | 154 | + max_frame = batch_video_mtx.shape[1] |
154 | - feature_dim = batch_video_mtx.shape[-1] | 155 | + feature_dim = batch_video_mtx.shape[-1] |
155 | - padded_segment_sizes = (batch_num_frames + segment_size - 1) // segment_size | 156 | + padded_segment_sizes = (batch_num_frames + segment_size - 1) // segment_size |
156 | - padded_segment_sizes *= segment_size | 157 | + padded_segment_sizes *= segment_size |
157 | - segment_mask = ( | 158 | + segment_mask = ( |
158 | - 0 < (padded_segment_sizes[:, np.newaxis] - np.arange(0, max_frame))) | 159 | + 0 < (padded_segment_sizes[:, np.newaxis] - np.arange(0, max_frame))) |
159 | - | 160 | + |
160 | - # Segment bags. | 161 | + # Segment bags. |
161 | - frame_bags = batch_video_mtx.reshape((-1, feature_dim)) | 162 | + frame_bags = batch_video_mtx.reshape((-1, feature_dim)) |
162 | - segment_frames = frame_bags[segment_mask.reshape(-1)].reshape( | 163 | + segment_frames = frame_bags[segment_mask.reshape(-1)].reshape( |
163 | - (-1, segment_size, feature_dim)) | 164 | + (-1, segment_size, feature_dim)) |
164 | - | 165 | + |
165 | - # Segment num frames. | 166 | + # Segment num frames. |
166 | - segment_start_times = np.arange(0, max_frame, segment_size) | 167 | + segment_start_times = np.arange(0, max_frame, segment_size) |
167 | - num_segments = batch_num_frames[:, np.newaxis] - segment_start_times | 168 | + num_segments = batch_num_frames[:, np.newaxis] - segment_start_times |
168 | - num_segment_bags = num_segments.reshape((-1)) | 169 | + num_segment_bags = num_segments.reshape((-1)) |
169 | - valid_segment_mask = num_segment_bags > 0 | 170 | + valid_segment_mask = num_segment_bags > 0 |
170 | - segment_num_frames = num_segment_bags[valid_segment_mask] | 171 | + segment_num_frames = num_segment_bags[valid_segment_mask] |
171 | - segment_num_frames[segment_num_frames > segment_size] = segment_size | 172 | + segment_num_frames[segment_num_frames > segment_size] = segment_size |
172 | - | 173 | + |
173 | - max_segment_num = (max_frame + segment_size - 1) // segment_size | 174 | + max_segment_num = (max_frame + segment_size - 1) // segment_size |
174 | - video_idxs = np.tile( | 175 | + video_idxs = np.tile( |
175 | - np.arange(0, video_batch_size)[:, np.newaxis], [1, max_segment_num]) | 176 | + np.arange(0, video_batch_size)[:, np.newaxis], [1, max_segment_num]) |
176 | - segment_idxs = np.tile(segment_start_times, [video_batch_size, 1]) | 177 | + segment_idxs = np.tile(segment_start_times, [video_batch_size, 1]) |
177 | - idx_bags = np.stack([video_idxs, segment_idxs], axis=-1).reshape((-1, 2)) | 178 | + idx_bags = np.stack([video_idxs, segment_idxs], axis=-1).reshape((-1, 2)) |
178 | - video_segment_ids = idx_bags[valid_segment_mask] | 179 | + video_segment_ids = idx_bags[valid_segment_mask] |
179 | - | 180 | + |
180 | - return { | 181 | + return { |
181 | - "video_batch": segment_frames, | 182 | + "video_batch": segment_frames, |
182 | - "num_frames_batch": segment_num_frames, | 183 | + "num_frames_batch": segment_num_frames, |
183 | - "video_segment_ids": video_segment_ids | 184 | + "video_segment_ids": video_segment_ids |
184 | - } | 185 | + } |
185 | 186 | ||
186 | 187 | ||
187 | def inference(reader, train_dir, data_pattern, out_file_location, batch_size, | 188 | def inference(reader, train_dir, data_pattern, out_file_location, batch_size, |
188 | top_k): | 189 | top_k): |
189 | - """Inference function.""" | 190 | + """Inference function.""" |
190 | - with tf.Session(config=tf.ConfigProto( | 191 | + with tf.Session(config=tf.ConfigProto( |
191 | - allow_soft_placement=True)) as sess, gfile.Open(out_file_location, | 192 | + allow_soft_placement=True)) as sess, gfile.Open(out_file_location, |
192 | - "w+") as out_file: | 193 | + "w+") as out_file: |
193 | - video_id_batch, video_batch, num_frames_batch = get_input_data_tensors( | 194 | + video_id_batch, video_batch, num_frames_batch = get_input_data_tensors( |
194 | - reader, data_pattern, batch_size) | 195 | + reader, data_pattern, batch_size) |
195 | - inference_model_name = "segment_inference_model" if FLAGS.segment_labels else "inference_model" | 196 | + inference_model_name = "segment_inference_model" if FLAGS.segment_labels else "inference_model" |
196 | - checkpoint_file = os.path.join(train_dir, "inference_model", | 197 | + checkpoint_file = os.path.join(train_dir, "inference_model", |
197 | - inference_model_name) | 198 | + inference_model_name) |
198 | - if not gfile.Exists(checkpoint_file + ".meta"): | 199 | + if not gfile.Exists(checkpoint_file + ".meta"): |
199 | - raise IOError("Cannot find %s. Did you run eval.py?" % checkpoint_file) | 200 | + raise IOError("Cannot find %s. Did you run eval.py?" % checkpoint_file) |
200 | - meta_graph_location = checkpoint_file + ".meta" | 201 | + meta_graph_location = checkpoint_file + ".meta" |
201 | - logging.info("loading meta-graph: " + meta_graph_location) | 202 | + logging.info("loading meta-graph: " + meta_graph_location) |
202 | - | 203 | + |
203 | - if FLAGS.output_model_tgz: | 204 | + if FLAGS.output_model_tgz: |
204 | - with tarfile.open(FLAGS.output_model_tgz, "w:gz") as tar: | 205 | + with tarfile.open(FLAGS.output_model_tgz, "w:gz") as tar: |
205 | - for model_file in glob.glob(checkpoint_file + ".*"): | 206 | + for model_file in glob.glob(checkpoint_file + ".*"): |
206 | - tar.add(model_file, arcname=os.path.basename(model_file)) | 207 | + tar.add(model_file, arcname=os.path.basename(model_file)) |
207 | - tar.add(os.path.join(train_dir, "model_flags.json"), | 208 | + tar.add(os.path.join(train_dir, "model_flags.json"), |
208 | - arcname="model_flags.json") | 209 | + arcname="model_flags.json") |
209 | - print("Tarred model onto " + FLAGS.output_model_tgz) | 210 | + print("Tarred model onto " + FLAGS.output_model_tgz) |
210 | - with tf.device("/cpu:0"): | 211 | + with tf.device("/cpu:0"): |
211 | - saver = tf.train.import_meta_graph(meta_graph_location, | 212 | + saver = tf.train.import_meta_graph(meta_graph_location, |
212 | - clear_devices=True) | 213 | + clear_devices=True) |
213 | - logging.info("restoring variables from " + checkpoint_file) | 214 | + logging.info("restoring variables from " + checkpoint_file) |
214 | - saver.restore(sess, checkpoint_file) | 215 | + saver.restore(sess, checkpoint_file) |
215 | - input_tensor = tf.get_collection("input_batch_raw")[0] | 216 | + input_tensor = tf.get_collection("input_batch_raw")[0] |
216 | - num_frames_tensor = tf.get_collection("num_frames")[0] | 217 | + num_frames_tensor = tf.get_collection("num_frames")[0] |
217 | - predictions_tensor = tf.get_collection("predictions")[0] | 218 | + predictions_tensor = tf.get_collection("predictions")[0] |
218 | - | 219 | + |
219 | - # Workaround for num_epochs issue. | 220 | + # Workaround for num_epochs issue. |
220 | - def set_up_init_ops(variables): | 221 | + def set_up_init_ops(variables): |
221 | - init_op_list = [] | 222 | + init_op_list = [] |
222 | - for variable in list(variables): | 223 | + for variable in list(variables): |
223 | - if "train_input" in variable.name: | 224 | + if "train_input" in variable.name: |
224 | - init_op_list.append(tf.assign(variable, 1)) | 225 | + init_op_list.append(tf.assign(variable, 1)) |
225 | - variables.remove(variable) | 226 | + variables.remove(variable) |
226 | - init_op_list.append(tf.variables_initializer(variables)) | 227 | + init_op_list.append(tf.variables_initializer(variables)) |
227 | - return init_op_list | 228 | + return init_op_list |
228 | - | 229 | + |
229 | - sess.run( | 230 | + sess.run( |
230 | - set_up_init_ops(tf.get_collection_ref(tf.GraphKeys.LOCAL_VARIABLES))) | 231 | + set_up_init_ops(tf.get_collection_ref(tf.GraphKeys.LOCAL_VARIABLES))) |
231 | - | 232 | + |
232 | - coord = tf.train.Coordinator() | 233 | + coord = tf.train.Coordinator() |
233 | - threads = tf.train.start_queue_runners(sess=sess, coord=coord) | 234 | + threads = tf.train.start_queue_runners(sess=sess, coord=coord) |
234 | - num_examples_processed = 0 | 235 | + num_examples_processed = 0 |
235 | - start_time = time.time() | 236 | + start_time = time.time() |
236 | - whitelisted_cls_mask = None | 237 | + whitelisted_cls_mask = None |
238 | + if FLAGS.segment_labels: | ||
239 | + final_out_file = out_file | ||
240 | + out_file = tempfile.NamedTemporaryFile() | ||
241 | + logging.info( | ||
242 | + "Segment temp prediction output will be written to temp file: %s", | ||
243 | + out_file.name) | ||
244 | + if FLAGS.segment_label_ids_file: | ||
245 | + whitelisted_cls_mask = np.zeros((predictions_tensor.get_shape()[-1],), | ||
246 | + dtype=np.float32) | ||
247 | + segment_label_ids_file = FLAGS.segment_label_ids_file | ||
248 | + if segment_label_ids_file.startswith("http"): | ||
249 | + logging.info("Retrieving segment ID whitelist files from %s...", | ||
250 | + segment_label_ids_file) | ||
251 | + segment_label_ids_file, _ = urllib.request.urlretrieve( | ||
252 | + segment_label_ids_file) | ||
253 | + with tf.io.gfile.GFile(segment_label_ids_file) as fobj: | ||
254 | + for line in fobj: | ||
255 | + try: | ||
256 | + cls_id = int(line) | ||
257 | + whitelisted_cls_mask[cls_id] = 1. | ||
258 | + except ValueError: | ||
259 | + # Simply skip the non-integer line. | ||
260 | + continue | ||
261 | + | ||
262 | + out_file.write(u"VideoId,LabelConfidencePairs\n".encode("utf8")) | ||
263 | + | ||
264 | + #========================================= | ||
265 | + # Open the vocabulary CSV file and map each class index to its name. | ||
266 | + #========================================= | ||
267 | + voca_dict = {} | ||
268 | + vocabs = open("./vocabulary.csv", 'r') | ||
269 | + while True: | ||
270 | + line = vocabs.readline() | ||
271 | + if not line: break | ||
272 | + vocab_dict_item = line.split(",") | ||
273 | + if vocab_dict_item[0] != "Index": | ||
274 | + voca_dict[vocab_dict_item[0]] = vocab_dict_item[3] # Column 3 of vocabulary.csv holds the class name. | ||
275 | + vocabs.close() | ||
276 | + try: | ||
277 | + while not coord.should_stop(): | ||
278 | + video_id_batch_val, video_batch_val, num_frames_batch_val = sess.run( | ||
279 | + [video_id_batch, video_batch, num_frames_batch]) | ||
237 | if FLAGS.segment_labels: | 280 | if FLAGS.segment_labels: |
238 | - final_out_file = out_file | 281 | + results = get_segments(video_batch_val, num_frames_batch_val, 5) |
239 | - out_file = tempfile.NamedTemporaryFile() | 282 | + video_segment_ids = results["video_segment_ids"] |
240 | - logging.info( | 283 | + video_id_batch_val = video_id_batch_val[video_segment_ids[:, 0]] |
241 | - "Segment temp prediction output will be written to temp file: %s", | 284 | + video_id_batch_val = np.array([ |
242 | - out_file.name) | 285 | + "%s:%d" % (x.decode("utf8"), y) |
243 | - if FLAGS.segment_label_ids_file: | 286 | + for x, y in zip(video_id_batch_val, video_segment_ids[:, 1]) |
244 | - whitelisted_cls_mask = np.zeros((predictions_tensor.get_shape()[-1],), | 287 | + ]) |
245 | - dtype=np.float32) | 288 | + video_batch_val = results["video_batch"] |
246 | - segment_label_ids_file = FLAGS.segment_label_ids_file | 289 | + num_frames_batch_val = results["num_frames_batch"] |
247 | - if segment_label_ids_file.startswith("http"): | 290 | + if input_tensor.get_shape()[1] != video_batch_val.shape[1]: |
248 | - logging.info("Retrieving segment ID whitelist files from %s...", | 291 | + raise ValueError("max_frames mismatch. Please re-run the eval.py " |
249 | - segment_label_ids_file) | 292 | + "with correct segment_labels settings.") |
250 | - segment_label_ids_file, _ = urllib.request.urlretrieve( | 293 | + |
251 | - segment_label_ids_file) | 294 | + predictions_val, = sess.run([predictions_tensor], |
252 | - with tf.io.gfile.GFile(segment_label_ids_file) as fobj: | 295 | + feed_dict={ |
253 | - for line in fobj: | 296 | + input_tensor: video_batch_val, |
254 | - try: | 297 | + num_frames_tensor: num_frames_batch_val |
255 | - cls_id = int(line) | 298 | + }) |
256 | - whitelisted_cls_mask[cls_id] = 1. | 299 | + now = time.time() |
257 | - except ValueError: | 300 | + num_examples_processed += len(video_batch_val) |
258 | - # Simply skip the non-integer line. | 301 | + elapsed_time = now - start_time |
259 | - continue | 302 | + logging.info("num examples processed: " + str(num_examples_processed) + |
260 | - | 303 | + " elapsed seconds: " + "{0:.2f}".format(elapsed_time) + |
261 | - out_file.write(u"VideoId,LabelConfidencePairs\n".encode("utf8")) | 304 | + " examples/sec: %.2f" % |
262 | - | 305 | + (num_examples_processed / elapsed_time)) |
263 | - try: | 306 | + for line in format_lines(video_id_batch_val, predictions_val, top_k, |
264 | - while not coord.should_stop(): | 307 | + whitelisted_cls_mask): |
265 | - video_id_batch_val, video_batch_val, num_frames_batch_val = sess.run( | 308 | + out_file.write(line) |
266 | - [video_id_batch, video_batch, num_frames_batch]) | 309 | + out_file.flush() |
267 | - if FLAGS.segment_labels: | 310 | + |
268 | - results = get_segments(video_batch_val, num_frames_batch_val, 5) | 311 | + except tf.errors.OutOfRangeError: |
269 | - video_segment_ids = results["video_segment_ids"] | 312 | + logging.info("Done with inference. The output file was written to " + |
270 | - video_id_batch_val = video_id_batch_val[video_segment_ids[:, 0]] | 313 | + out_file.name) |
271 | - video_id_batch_val = np.array([ | 314 | + finally: |
272 | - "%s:%d" % (x.decode("utf8"), y) | 315 | + coord.request_stop() |
273 | - for x, y in zip(video_id_batch_val, video_segment_ids[:, 1]) | 316 | + |
274 | - ]) | 317 | + if FLAGS.segment_labels: |
275 | - video_batch_val = results["video_batch"] | 318 | + # Re-read the file and do heap sort. |
276 | - num_frames_batch_val = results["num_frames_batch"] | 319 | + # Create multiple heaps. |
277 | - if input_tensor.get_shape()[1] != video_batch_val.shape[1]: | 320 | + logging.info("Post-processing segment predictions...") |
278 | - raise ValueError("max_frames mismatch. Please re-run the eval.py " | 321 | + segment_id_list = [] |
279 | - "with correct segment_labels settings.") | 322 | + segment_classes = [] |
280 | - | 323 | + cls_result_arr = [] |
281 | - predictions_val, = sess.run([predictions_tensor], | 324 | + cls_score_dict = {} |
282 | - feed_dict={ | 325 | + out_file.seek(0, 0) |
283 | - input_tensor: video_batch_val, | 326 | + old_seg_name = '0000' |
284 | - num_frames_tensor: num_frames_batch_val | 327 | + for line in out_file: |
285 | - }) | 328 | + segment_id, preds = line.decode("utf8").split(",") |
286 | - now = time.time() | 329 | + if segment_id == "VideoId": |
287 | - num_examples_processed += len(video_batch_val) | 330 | + # Skip the headline. |
288 | - elapsed_time = now - start_time | 331 | + continue |
289 | - logging.info("num examples processed: " + str(num_examples_processed) + | 332 | + |
290 | - " elapsed seconds: " + "{0:.2f}".format(elapsed_time) + | 333 | + preds = preds.split(" ") |
291 | - " examples/sec: %.2f" % | 334 | + pred_cls_ids = [int(preds[idx]) for idx in range(0, len(preds), 2)] |
292 | - (num_examples_processed / elapsed_time)) | 335 | + pred_cls_scores = [float(preds[idx]) for idx in range(1, len(preds), 2)] |
293 | - for line in format_lines(video_id_batch_val, predictions_val, top_k, | 336 | + #======================================= |
294 | - whitelisted_cls_mask): | 337 | + segment_id = str(segment_id.split(":")[0]) |
295 | - out_file.write(line) | 338 | + if segment_id not in segment_id_list: |
296 | - out_file.flush() | 339 | + segment_id_list.append(str(segment_id)) |
297 | - | 340 | + segment_classes.append("") |
298 | - except tf.errors.OutOfRangeError: | 341 | + |
299 | - logging.info("Done with inference. The output file was written to " + | 342 | + index = segment_id_list.index(segment_id) |
300 | - out_file.name) | 343 | + |
301 | - finally: | 344 | + if old_seg_name != segment_id: |
302 | - coord.request_stop() | 345 | + cls_score_dict[segment_id] = {} |
303 | - | 346 | + old_seg_name = segment_id |
304 | - if FLAGS.segment_labels: | 347 | + |
305 | - # Re-read the file and do heap sort. | 348 | + for classes in range(0, len(pred_cls_ids)): |
306 | - # Create multiple heaps. | 349 | + segment_classes[index] = str(segment_classes[index]) + str(pred_cls_ids[classes]) + " " # Append classes from the new segment. |
307 | - logging.info("Post-processing segment predictions...") | 350 | + if pred_cls_ids[classes] in cls_score_dict[segment_id]: |
308 | - segment_id_list = [] | 351 | + cls_score_dict[segment_id][pred_cls_ids[classes]] = cls_score_dict[segment_id][pred_cls_ids[classes]] + pred_cls_scores[classes] |
309 | - segment_classes = [] | 352 | + else: |
310 | - cls_result_arr = [] | 353 | + cls_score_dict[segment_id][pred_cls_ids[classes]] = pred_cls_scores[classes] |
311 | - out_file.seek(0, 0) | 354 | + |
312 | - for line in out_file: | 355 | + for segs,item in zip(segment_id_list,segment_classes): |
313 | - segment_id, preds = line.decode("utf8").split(",") | 356 | + print('====== R E C O R D ======') |
314 | - if segment_id == "VideoId": | 357 | + cls_arr = item.split(" ")[:-1] |
315 | - # Skip the headline. | 358 | + |
316 | - continue | 359 | + cls_arr = list(map(int,cls_arr)) |
317 | - | 360 | + cls_arr = sorted(cls_arr) # Sort by class ID. |
318 | - preds = preds.split(" ") | 361 | + |
319 | - pred_cls_ids = [int(preds[idx]) for idx in range(0, len(preds), 2)] | 362 | + result_string = "" |
320 | - # ======================================= | 363 | + |
321 | - segment_id = str(segment_id.split(":")[0]) | 364 | + temp = cls_score_dict[segs] |
322 | - if segment_id not in segment_id_list: | 365 | + temp = sorted(temp.items(), key=operator.itemgetter(1), reverse=True) # Sort by score, descending. |
323 | - segment_id_list.append(str(segment_id)) | 366 | + denominator = float(temp[0][1] + temp[1][1] + temp[2][1] + temp[3][1] + temp[4][1]) # Sum of the top-5 scores, used for normalization. |
324 | - segment_classes.append("") | 367 | + #for item in temp: |
325 | - | 368 | + for itemIndex in range(0, top_k): |
326 | - index = segment_id_list.index(segment_id) | 369 | + result_string = result_string + str(voca_dict[str(temp[itemIndex][0])]) + ":" + format(temp[itemIndex][1] / denominator, ".3f") + "," |
327 | - for classes in pred_cls_ids: | 370 | + |
328 | - segment_classes[index] = str(segment_classes[index]) + str( | 371 | + cls_result_arr.append(result_string[:-1]) |
329 | - classes) + " " # append classes from new segment | 372 | + logging.info(segs + " : " + result_string[:-1]) |
330 | - | 373 | + #======================================= |
331 | - for segs, item in zip(segment_id_list, segment_classes): | 374 | + final_out_file.write("vid_id,seg_classes\n") |
332 | - print('====== R E C O R D ======') | 375 | + for seg_id, class_indices in zip(segment_id_list, cls_result_arr): |
333 | - cls_arr = item.split(" ")[:-1] | 376 | + final_out_file.write("%s,%s\n" % (seg_id, str(class_indices))) |
334 | - | 377 | + final_out_file.close() |
335 | - cls_arr = list(map(int, cls_arr)) | 378 | + |
336 | - cls_arr = sorted(cls_arr) | 379 | + out_file.close() |
337 | - | 380 | + |
338 | - result_string = "" | 381 | + coord.join(threads) |
339 | - | 382 | + sess.close() |
340 | - temp = Counter(cls_arr) | ||
341 | - for item in temp: | ||
342 | - result_string = result_string + str(item) + ":" + str(temp[item]) + "," | ||
343 | - | ||
344 | - cls_result_arr.append(result_string[:-1]) | ||
345 | - logging.info(segs + " : " + result_string[:-1]) | ||
346 | - # ======================================= | ||
347 | - final_out_file.write("vid_id,seg_classes\n") | ||
348 | - for seg_id, class_indcies in zip(segment_id_list, cls_result_arr): | ||
349 | - final_out_file.write("%s,%s\n" % (seg_id, str(class_indcies))) | ||
350 | - final_out_file.close() | ||
351 | - | ||
352 | - out_file.close() | ||
353 | - | ||
354 | - coord.join(threads) | ||
355 | - sess.close() | ||
356 | - | ||
357 | 383 | ||
358 | def main(unused_argv): | 384 | def main(unused_argv): |
359 | - logging.set_verbosity(tf.logging.INFO) | 385 | + logging.set_verbosity(tf.logging.INFO) |
360 | - if FLAGS.input_model_tgz: | 386 | + if FLAGS.input_model_tgz: |
361 | - if FLAGS.train_dir: | 387 | + if FLAGS.train_dir: |
362 | - raise ValueError("You cannot supply --train_dir if supplying " | 388 | + raise ValueError("You cannot supply --train_dir if supplying " |
363 | - "--input_model_tgz") | 389 | + "--input_model_tgz") |
364 | - # Untar. | 390 | + # Untar. |
365 | - if not os.path.exists(FLAGS.untar_model_dir): | 391 | + if not os.path.exists(FLAGS.untar_model_dir): |
366 | - os.makedirs(FLAGS.untar_model_dir) | 392 | + os.makedirs(FLAGS.untar_model_dir) |
367 | - tarfile.open(FLAGS.input_model_tgz).extractall(FLAGS.untar_model_dir) | 393 | + tarfile.open(FLAGS.input_model_tgz).extractall(FLAGS.untar_model_dir) |
368 | - FLAGS.train_dir = FLAGS.untar_model_dir | 394 | + FLAGS.train_dir = FLAGS.untar_model_dir |
369 | - | 395 | + |
370 | - flags_dict_file = os.path.join(FLAGS.train_dir, "model_flags.json") | 396 | + flags_dict_file = os.path.join(FLAGS.train_dir, "model_flags.json") |
371 | - if not file_io.file_exists(flags_dict_file): | 397 | + if not file_io.file_exists(flags_dict_file): |
372 | - raise IOError("Cannot find %s. Did you run eval.py?" % flags_dict_file) | 398 | + raise IOError("Cannot find %s. Did you run eval.py?" % flags_dict_file) |
373 | - flags_dict = json.loads(file_io.FileIO(flags_dict_file, "r").read()) | 399 | + flags_dict = json.loads(file_io.FileIO(flags_dict_file, "r").read()) |
374 | - | 400 | + |
375 | - # convert feature_names and feature_sizes to lists of values | 401 | + # convert feature_names and feature_sizes to lists of values |
376 | - feature_names, feature_sizes = utils.GetListOfFeatureNamesAndSizes( | 402 | + feature_names, feature_sizes = utils.GetListOfFeatureNamesAndSizes( |
377 | - flags_dict["feature_names"], flags_dict["feature_sizes"]) | 403 | + flags_dict["feature_names"], flags_dict["feature_sizes"]) |
378 | - | 404 | + |
379 | - if flags_dict["frame_features"]: | 405 | + if flags_dict["frame_features"]: |
380 | - reader = readers.YT8MFrameFeatureReader(feature_names=feature_names, | 406 | + reader = readers.YT8MFrameFeatureReader(feature_names=feature_names, |
381 | - feature_sizes=feature_sizes) | 407 | + feature_sizes=feature_sizes) |
382 | - else: | 408 | + else: |
383 | - reader = readers.YT8MAggregatedFeatureReader(feature_names=feature_names, | 409 | + reader = readers.YT8MAggregatedFeatureReader(feature_names=feature_names, |
384 | - feature_sizes=feature_sizes) | 410 | + feature_sizes=feature_sizes) |
385 | - | 411 | + |
386 | - if not FLAGS.output_file: | 412 | + if not FLAGS.output_file: |
387 | - raise ValueError("'output_file' was not specified. " | 413 | + raise ValueError("'output_file' was not specified. " |
388 | - "Unable to continue with inference.") | 414 | + "Unable to continue with inference.") |
389 | - | 415 | + |
390 | - if not FLAGS.input_data_pattern: | 416 | + if not FLAGS.input_data_pattern: |
391 | - raise ValueError("'input_data_pattern' was not specified. " | 417 | + raise ValueError("'input_data_pattern' was not specified. " |
392 | - "Unable to continue with inference.") | 418 | + "Unable to continue with inference.") |
393 | - | 419 | + |
394 | - inference(reader, FLAGS.train_dir, FLAGS.input_data_pattern, | 420 | + inference(reader, FLAGS.train_dir, FLAGS.input_data_pattern, |
395 | - FLAGS.output_file, FLAGS.batch_size, FLAGS.top_k) | 421 | + FLAGS.output_file, FLAGS.batch_size, FLAGS.top_k) |
396 | 422 | ||
397 | 423 | ||
398 | if __name__ == "__main__": | 424 | if __name__ == "__main__": |
399 | - app.run() | 425 | + app.run() |
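For readers following the change: the new post-processing drops the old `Counter`-based occurrence counting and instead accumulates each class's scores across a video's segments (`cls_score_dict`), ranks them with `operator.itemgetter`, and normalizes by the sum of the top-5 aggregated scores before writing name:score pairs (class names are read from the fourth column of `vocabulary.csv`). Below is a minimal sketch of that aggregation outside the TF session; the video IDs and scores are made up for illustration.

```python
import operator
from collections import defaultdict

# Hypothetical per-segment predictions, keyed "videoId:startTime" as in the
# diff's segment output. Each value is a list of (class_id, score) pairs.
raw_predictions = {
    "abc123:0": [(3, 0.9), (7, 0.4), (11, 0.2), (20, 0.1), (31, 0.05)],
    "abc123:5": [(3, 0.8), (11, 0.3), (7, 0.2), (20, 0.1), (44, 0.05)],
}

# 1) Sum each class's scores across all segments of the same video,
#    mirroring cls_score_dict in the new code.
video_scores = defaultdict(lambda: defaultdict(float))
for seg_key, preds in raw_predictions.items():
    video_id = seg_key.split(":")[0]
    for cls_id, score in preds:
        video_scores[video_id][cls_id] += score

# 2) Rank classes by aggregated score and normalize by the top-5 sum,
#    as the new code does with operator.itemgetter and `denominator`.
for video_id, cls_scores in video_scores.items():
    ranked = sorted(cls_scores.items(), key=operator.itemgetter(1), reverse=True)
    denominator = sum(score for _, score in ranked[:5])
    pairs = ",".join("%d:%.3f" % (cls_id, score / denominator)
                     for cls_id, score in ranked[:5])
    print("%s,%s" % (video_id, pairs))
```

Note that the committed code indexes `temp[0][1]` through `temp[4][1]` directly, so it assumes at least five distinct classes per video; the sketch's `ranked[:5]` slice is a more forgiving stand-in for that step.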