#coding=utf-8
import tensorflow as tf
import sys
import cv2
import os
import random  # needed by plt_bboxes below (missing in the original)
import matplotlib.pyplot as plt
from PIL import Image
import numpy as np
import csv

# Make the TensorFlow models/research directory (and its parent) importable
# so that the object_detection utilities can be found.
TF_API="/home/robin/eclipse-workspace-python/TF_models/models/research"
sys.path.append(os.path.split(TF_API)[0])
sys.path.append(TF_API)

from object_detection.utils import visualization_utils as vis_util
slim = tf.contrib.slim


NUM_CLASSES = 20
SPLITS_TO_SIZES = {
    'train': 5011,
    'test': 4952,
}
ITEMS_TO_DESCRIPTIONS = {
    'image': 'A color image of varying height and width.',
    'shape': 'Shape of the image.',
    'object/bbox': 'A list of bounding boxes, one per object.',
    'object/label': 'A list of labels, one per object.',
}

labels_to_class = ['none', 'aeroplane', 'bicycle', 'bird', 'boat', 'bottle', 'bus',
                   'car', 'cat', 'chair', 'cow', 'diningtable', 'dog', 'horse',
                   'motorbike', 'person', 'pottedplant', 'sheep', 'sofa',
                   'train', 'tvmonitor']

FILE_PATTERN = 'voc_2007_%s_*.tfrecord'

def _get_output_filename(dataset_dir, split_name):
    """Builds the file pattern matching a split's tfrecord shards.
    Args:
      dataset_dir: The dataset directory where the dataset is stored.
      split_name: The name of the train/test split.
    Returns:
      A glob pattern matching the split's tfrecord files (not a single
      absolute path).
    """
    return '%s/%s*.tfrecord' % (dataset_dir, split_name)

def bboxes_draw_on_img(img, classes, bboxes, colors, thickness=2):
    """Draws labeled boxes on `img` in place.

    `bboxes` rows are normalized [ymin, xmin, ymax, xmax]; they are scaled
    back to pixels and reversed into the (x, y) order OpenCV expects.
    """
    shape = img.shape
    for i in range(bboxes.shape[0]):
        bbox = bboxes[i]
        # Draw the bounding box: scale normalized (y, x) corners to pixels.
        p1 = (int(bbox[0] * shape[0]), int(bbox[1] * shape[1]))
        p2 = (int(bbox[2] * shape[0]), int(bbox[3] * shape[1]))
        cv2.rectangle(img, p1[::-1], p2[::-1], colors, thickness)
        # Draw the class name just inside the top-left corner.
        s = '%s' % (labels_to_class[classes[i]])
        p1 = (p1[0] + 15, p1[1] + 5)
        cv2.putText(img, s, p1[::-1], cv2.FONT_HERSHEY_DUPLEX, 0.4, colors, 1)
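
# A hedged usage sketch (not part of the original script): drawing one
# hypothetical detection with OpenCV. The file name, class id, and box
# coordinates are illustrative assumptions.
def example_bboxes_draw(image_path='example.jpg'):
    img = cv2.imread(image_path)                  # BGR image, shape (H, W, 3)
    classes = np.array([15])                      # index 15 -> 'person'
    bboxes = np.array([[0.1, 0.2, 0.9, 0.8]])     # normalized [ymin, xmin, ymax, xmax]
    bboxes_draw_on_img(img, classes, bboxes, colors=(0, 255, 0))
    cv2.imwrite('example_boxed.jpg', img)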

def get_split(split_name, dataset_dir, file_pattern=None, reader=None):
    """Gets a dataset tuple with instructions for reading Pascal VOC data.
    Args:
      split_name: A train/test split name.
      dataset_dir: The base directory of the dataset sources.
      file_pattern: The file pattern to use when matching the dataset sources.
        It is assumed that the pattern contains a '%s' string so that the split
        name can be inserted.
      reader: The TensorFlow reader type.
    Returns:
      A `Dataset` namedtuple.
    Raises:
      ValueError: if `split_name` is not a valid train/test split.
    """
    if split_name not in SPLITS_TO_SIZES:
        raise ValueError('split name %s was not recognized.' % split_name)

    if not file_pattern:
        file_pattern = FILE_PATTERN
    file_pattern = os.path.join(dataset_dir, file_pattern % split_name)

    # Allowing None in the signature so that dataset_factory can use the default.
    if reader is None:
        reader = tf.TFRecordReader
#    # File name pattern:
#    if file_pattern is None:
#        file_pattern = _get_output_filename('tfrecords', 'voc_2007_train')  # adjust to your file names
#        print(file_pattern)

    # Adapter 1: deserialize each Example back into the features it was
    # stored with. Handled by TF itself.
    keys_to_features = {
        'image/encoded': tf.FixedLenFeature((), tf.string, default_value=''),
        'image/format': tf.FixedLenFeature((), tf.string, default_value='jpg'),
        'image/height': tf.FixedLenFeature([1], tf.int64),
        'image/width': tf.FixedLenFeature([1], tf.int64),
        'image/channels': tf.FixedLenFeature([1], tf.int64),
        'image/shape': tf.FixedLenFeature([3], tf.int64),
        'image/object/bbox/xmin': tf.VarLenFeature(dtype=tf.float32),
        'image/object/bbox/ymin': tf.VarLenFeature(dtype=tf.float32),
        'image/object/bbox/xmax': tf.VarLenFeature(dtype=tf.float32),
        'image/object/bbox/ymax': tf.VarLenFeature(dtype=tf.float32),
        'image/object/bbox/label': tf.VarLenFeature(dtype=tf.int64),
        'image/object/bbox/difficult': tf.VarLenFeature(dtype=tf.int64),
        'image/object/bbox/truncated': tf.VarLenFeature(dtype=tf.int64),
    }

    # Adapter 2: assemble the deserialized features into higher-level items.
    # Handled by slim.
    items_to_handlers = {
        'image': slim.tfexample_decoder.Image('image/encoded', 'image/format'),
        'shape': slim.tfexample_decoder.Tensor('image/shape'),
        'object/bbox': slim.tfexample_decoder.BoundingBox(
            ['ymin', 'xmin', 'ymax', 'xmax'], 'image/object/bbox/'),
        'object/label': slim.tfexample_decoder.Tensor('image/object/bbox/label'),
        'object/difficult': slim.tfexample_decoder.Tensor('image/object/bbox/difficult'),
        'object/truncated': slim.tfexample_decoder.Tensor('image/object/bbox/truncated'),
    }
    # Decoder combining the two adapters.
    decoder = slim.tfexample_decoder.TFExampleDecoder(keys_to_features, items_to_handlers)

    # The Dataset object records the metadata: file locations, decoder, sizes.
    dataset = slim.dataset.Dataset(
        data_sources=file_pattern,
        reader=reader,
        num_samples=SPLITS_TO_SIZES[split_name],  # size of the requested split (was hard-coded to 'test')
        decoder=decoder,
        items_to_descriptions=ITEMS_TO_DESCRIPTIONS,
        num_classes=NUM_CLASSES)
    return dataset
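
# A hedged usage sketch (not part of the original script): consuming the slim
# Dataset with a DatasetDataProvider. The 'tfrecords' directory is an
# illustrative assumption.
def example_read_split(dataset_dir='tfrecords'):
    dataset = get_split('test', dataset_dir)
    provider = slim.dataset_data_provider.DatasetDataProvider(
        dataset, num_readers=1, shuffle=False)
    # Tensors for one sample; run them in a session with queue runners started.
    image, shape, bboxes, labels = provider.get(
        ['image', 'shape', 'object/bbox', 'object/label'])
    return image, shape, bboxes, labels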

# Read and decode a single example from a tfrecords file.
def decode_from_tfrecords(filename, num_epoch=None):
    # Large datasets are usually sharded across many files, hence the list of
    # file names handed to the queue.
    filename_queue = tf.train.string_input_producer([filename], num_epochs=num_epoch)
    reader = tf.TFRecordReader()
    _, serialized = reader.read(filename_queue)
    example = tf.parse_single_example(serialized, features={
        'image/height': tf.FixedLenFeature([], tf.int64),
        'image/width': tf.FixedLenFeature([], tf.int64),
        'image/encoded': tf.FixedLenFeature([], tf.string),
        'image/object/class/label': tf.FixedLenFeature([], tf.int64)
    })
    label = tf.cast(example['image/object/class/label'], tf.int32)
    # 'image/encoded' holds compressed JPEG bytes, so decode the image instead
    # of reinterpreting the raw buffer (tf.decode_raw, as in the original,
    # cannot be reshaped to height x width x 3 here).
    image = tf.image.decode_jpeg(example['image/encoded'], channels=3)

    print('decode_from_tfrecords: ', image)
    print('decode_from_tfrecords: ', label)
    return image, label
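
# A hedged usage sketch (not part of the original script): pulling one decoded
# example inside a session. The tfrecord path is an illustrative assumption.
def example_decode_from_tfrecords(filename='tfrecords/voc_2007_train_000.tfrecord'):
    image, label = decode_from_tfrecords(filename)
    with tf.Session() as sess:
        sess.run(tf.global_variables_initializer())
        sess.run(tf.local_variables_initializer())
        coord = tf.train.Coordinator()
        threads = tf.train.start_queue_runners(coord=coord)
        image_val, label_val = sess.run([image, label])
        print(image_val.shape, label_val)
        coord.request_stop()
        coord.join(threads)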

def plt_bboxes(img, classes, scores, bboxes, figsize=(10, 10), linewidth=1.5):
    """Visualize bounding boxes. Largely inspired by SSD-MXNET!"""
    fig = plt.figure(figsize=figsize)
    plt.imshow(img)
    height = img.shape[0]
    width = img.shape[1]
    colors = dict()
    for i in range(classes.shape[0]):
        cls_id = int(classes[i])
        if cls_id >= 0:
            score = scores[i]
            # Assign each class a random but stable color.
            if cls_id not in colors:
                colors[cls_id] = (random.random(), random.random(), random.random())
            ymin = int(bboxes[i, 0] * height)
            xmin = int(bboxes[i, 1] * width)
            ymax = int(bboxes[i, 2] * height)
            xmax = int(bboxes[i, 3] * width)
#            crop_img = img[xmin:(xmax - xmin), xmax:(ymax - ymin)]
#            misc.imsave('1.jpg', crop_img)
            rect = plt.Rectangle((xmin, ymin), xmax - xmin,
                                 ymax - ymin, fill=False,
                                 edgecolor=colors[cls_id],
                                 linewidth=linewidth)
            plt.gca().add_patch(rect)
            class_name = labels_to_class[cls_id]  # was the undefined CLASSES
            plt.gca().text(xmin, ymin - 2,
                           '{:s} | {:.3f}'.format(class_name, score),
                           bbox=dict(facecolor=colors[cls_id], alpha=0.5),
                           fontsize=12, color='white')
    plt.show()
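
# A hedged usage sketch (not part of the original script): plotting one
# hypothetical detection. The file name, class id, and score are illustrative.
def example_plt_bboxes(image_path='example.jpg'):
    img = np.array(Image.open(image_path))
    classes = np.array([12])                      # index 12 -> 'dog'
    scores = np.array([0.95])
    bboxes = np.array([[0.1, 0.2, 0.9, 0.8]])     # normalized [ymin, xmin, ymax, xmax]
    plt_bboxes(img, classes, scores, bboxes)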

def write_file(file_name_string, seg):
    # Text mode for Python 3's csv module ('wb' only works on Python 2).
    with open(file_name_string, 'w') as csvfile:
        spamwriter = csv.writer(csvfile, dialect='excel')
        for i in range(seg.shape[0]):
            spamwriter.writerow(seg[i][:])
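
# A hedged usage sketch (not part of the original script): dumping a small
# array to CSV.
# write_file('mask.csv', np.zeros((4, 4), dtype=np.uint8))
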
def test():
    reconstructed_images = []
    record_iterator = tf.python_io.tf_record_iterator(path=
        '/home/robin/Dataset/VOC/VOC2012_VOCtrainval/sematic_segmentation_tfrecord/val-00001-of-00002.tfrecord')
    init = tf.global_variables_initializer()
    with tf.Session() as sess:
        sess.run(init)
        coord = tf.train.Coordinator()
        threads = tf.train.start_queue_runners(coord=coord)

        for string_iterator in record_iterator:
            plt.figure(figsize=(12, 12))
            example = tf.train.Example()
            example.ParseFromString(string_iterator)
            height = example.features.feature['image/height'].int64_list.value[0]
            width = example.features.feature['image/width'].int64_list.value[0]
            encoded_image_string = example.features.feature['image/encoded'].bytes_list.value[0]
            #label = example.features.feature['image/object/class/label'].int64_list.value[0]
            #xmin = example.features.feature['image/object/bbox/xmin'].float_list.value[0]
            #xmax = example.features.feature['image/object/bbox/xmax'].float_list.value[0]
            #ymin = example.features.feature['image/object/bbox/ymin'].float_list.value[0]
            #ymax = example.features.feature['image/object/bbox/ymax'].float_list.value[0]

            encoded_mask_string = example.features.feature['image/segmentation/class/encoded'].bytes_list.value[0]

            # Note: new decode ops are added to the graph on every iteration,
            # which is fine for a quick inspection script.
            plt.subplot(131)
            mask_decode_png = tf.image.decode_png(encoded_mask_string, channels=1)
            # Binarize the mask: every non-background class id becomes 1.
            fix_mask = tf.cast(tf.greater(mask_decode_png, 0), tf.uint8)

            redecode_mask_img = sess.run(mask_decode_png)
#            write_file("mask.csv", redecode_mask_img)
            print(redecode_mask_img.shape)
            redecode_mask = redecode_mask_img * 255
            mask_img = np.squeeze(redecode_mask, axis=2)
            plt.imshow(mask_img)
            plt.title('segmentation map')
            #im = Image.fromarray(mask_img)
            #im.save("pets.png")

            plt.subplot(132)
            decoded_img = tf.image.decode_jpeg(encoded_image_string, channels=3)
            reconstructed_img = sess.run(decoded_img)
            print(reconstructed_img.shape)
            plt.imshow(reconstructed_img)
            plt.title('input image')

            plt.subplot(133)
            vis_util.draw_mask_on_image_array(
                image=reconstructed_img,
                mask=np.squeeze(sess.run(fix_mask), axis=2),
                alpha=0.8)
            plt.imshow(reconstructed_img)
            plt.title('segmentation overlay')

            plt.show()

        coord.request_stop()
        coord.join(threads)


if __name__ == '__main__':
    test()