HiKapok
diff --git a/Diff for: ‎README.md
+8 b/Diff for: ‎README.md
+8
diff --git a/Diff for: ‎convert_caffe_ron.py
+62 b/Diff for: ‎convert_caffe_ron.py
+62
diff --git a/Diff for: ‎datasets/dataset_factory.py
+29-1 b/Diff for: ‎datasets/dataset_factory.py
+29-1
diff --git a/Diff for: ‎datasets/pascalvoc_2007.py
+4-2 b/Diff for: ‎datasets/pascalvoc_2007.py
+4-2
diff --git a/Diff for: ‎datasets/pascalvoc_2007_2012.py
+118 b/Diff for: ‎datasets/pascalvoc_2007_2012.py
+118
diff --git a/Diff for: ‎datasets/pascalvoc_2012.py
+7-5 b/Diff for: ‎datasets/pascalvoc_2012.py
+7-5
diff --git a/Diff for: ‎datasets/pascalvoc_common.py
+23-2 b/Diff for: ‎datasets/pascalvoc_common.py
+23-2
@@ -6,5 +6,13 @@ This repository contains code of the re-implement of RON following the above pap
 
 The code is modified from [SSD-Tensorflow](https://github.com/balancap/SSD-Tensorflow). You can use the code to train/evaluate a network for object detection task. 
 For more details, please refer to [README of SSD-Tensorflow](https://github.com/balancap/SSD-Tensorflow/blob/master/README.md).
+##  ##
+update:
 
+- Add SSD preprocessing method using Tensorflow
+- Modify the network to match the original Caffe code
+- Add NMS using Tensorflow ops to support two modes
+- Replica GPU training support
+- Add voc eval
 
+Note: Training is in progress, and the model will be released later.
@@ -0,0 +1,62 @@
+#convert from caffe
+# https://github.com/hujie-frank/SENet
+# https://github.com/ruotianluo/pytorch-resnet
+# /ruotianluo/pytorch-resnet/master/convert.py
+#
+# install caffe python 3.6
+#   https://yangcha.github.io/Caffe-Conda3/
+
+# import caffe
+import sys
+import os
+sys.path.insert(0,'/media/rs/7A0EE8880EE83EAF1/Kapok/caffe-master/python')
+os.environ["GLOG_minloglevel"] = "2"
+import caffe
+from caffe.proto import caffe_pb2
+
+
+# others
+import re
+import numpy as np
+from collections import OrderedDict
+import cv2
+
+
+
+
+##--------------------------------------------------------
+
+# how to get caffe keys:
+#   caffe_model.params.keys()
+#   odict_keys(['conv1/7x7_s2', 'conv1/7x7_s2/bn', 'conv1/7x7_s2/bn/scale', 'conv2_1_1x1_reduce', 'conv2_1_1x1_reduce/bn', 'conv2_1_1x1_reduce/bn/scale', 'conv2_1_3x3', 'conv2_1_3x3/bn', 'conv2_1_3x3/bn/scale', 'conv2_1_1x1_increase', 'conv2_1_1x1_increase/bn', 'conv2_1_1x1_increase/bn/scale', 'conv2_1_1x1_down', 'conv2_1_1x1_up', 'conv2_1_1x1_proj', 'conv2_1_1x1_proj/bn', 'conv2_1_1x1_proj/bn/scale', 'conv2_2_1x1_reduce', 'conv2_2_1x1_reduce/bn', 'conv2_2_1x1_reduce/bn/scale', 'conv2_2_3x3', 'conv2_2_3x3/bn', 'conv2_2_3x3/bn/scale', 'conv2_2_1x1_increase', 'conv2_2_1x1_increase/bn', 'conv2_2_1x1_increase/bn/scale', 'conv2_2_1x1_down', 'conv2_2_1x1_up', 'conv2_3_1x1_reduce', 'conv2_3_1x1_reduce/bn', 'conv2_3_1x1_reduce/bn/scale', 'conv2_3_3x3', 'conv2_3_3x3/bn', 'conv2_3_3x3/bn/scale', 'conv2_3_1x1_increase', 'conv2_3_1x1_increase/bn', 'conv2_3_1x1_increase/bn/scale', 'conv2_3_1x1_down', 'conv2_3_1x1_up', 'conv3_1_1x1_reduce', 'conv3_1_1x1_reduce/bn', 'conv3_1_1x1_reduce/bn/scale', 'conv3_1_3x3', 'conv3_1_3x3/bn', 'conv3_1_3x3/bn/scale', 'conv3_1_1x1_increase', 'conv3_1_1x1_increase/bn', 'conv3_1_1x1_increase/bn/scale', 'conv3_1_1x1_down', 'conv3_1_1x1_up', 'conv3_1_1x1_proj', 'conv3_1_1x1_proj/bn', 'conv3_1_1x1_proj/bn/scale', 'conv3_2_1x1_reduce', 'conv3_2_1x1_reduce/bn', 'conv3_2_1x1_reduce/bn/scale', 'conv3_2_3x3', 'conv3_2_3x3/bn', 'conv3_2_3x3/bn/scale', 'conv3_2_1x1_increase', 'conv3_2_1x1_increase/bn', 'conv3_2_1x1_increase/bn/scale', 'conv3_2_1x1_down', 'conv3_2_1x1_up', 'conv3_3_1x1_reduce', 'conv3_3_1x1_reduce/bn', 'conv3_3_1x1_reduce/bn/scale', 'conv3_3_3x3', 'conv3_3_3x3/bn', 'conv3_3_3x3/bn/scale', 'conv3_3_1x1_increase', 'conv3_3_1x1_increase/bn', 'conv3_3_1x1_increase/bn/scale', 'conv3_3_1x1_down', 'conv3_3_1x1_up', 'conv3_4_1x1_reduce', 'conv3_4_1x1_reduce/bn', 'conv3_4_1x1_reduce/bn/scale', 'conv3_4_3x3', 'conv3_4_3x3/bn', 'conv3_4_3x3/bn/scale', 'conv3_4_1x1_increase', 'conv3_4_1x1_increase/bn', 'conv3_4_1x1_increase/bn/scale', 
'conv3_4_1x1_down', 'conv3_4_1x1_up', 'conv4_1_1x1_reduce', 'conv4_1_1x1_reduce/bn', 'conv4_1_1x1_reduce/bn/scale', 'conv4_1_3x3', 'conv4_1_3x3/bn', 'conv4_1_3x3/bn/scale', 'conv4_1_1x1_increase', 'conv4_1_1x1_increase/bn', 'conv4_1_1x1_increase/bn/scale', 'conv4_1_1x1_down', 'conv4_1_1x1_up', 'conv4_1_1x1_proj', 'conv4_1_1x1_proj/bn', 'conv4_1_1x1_proj/bn/scale', 'conv4_2_1x1_reduce', 'conv4_2_1x1_reduce/bn', 'conv4_2_1x1_reduce/bn/scale', 'conv4_2_3x3', 'conv4_2_3x3/bn', 'conv4_2_3x3/bn/scale', 'conv4_2_1x1_increase', 'conv4_2_1x1_increase/bn', 'conv4_2_1x1_increase/bn/scale', 'conv4_2_1x1_down', 'conv4_2_1x1_up', 'conv4_3_1x1_reduce', 'conv4_3_1x1_reduce/bn', 'conv4_3_1x1_reduce/bn/scale', 'conv4_3_3x3', 'conv4_3_3x3/bn', 'conv4_3_3x3/bn/scale', 'conv4_3_1x1_increase', 'conv4_3_1x1_increase/bn', 'conv4_3_1x1_increase/bn/scale', 'conv4_3_1x1_down', 'conv4_3_1x1_up', 'conv4_4_1x1_reduce', 'conv4_4_1x1_reduce/bn', 'conv4_4_1x1_reduce/bn/scale', 'conv4_4_3x3', 'conv4_4_3x3/bn', 'conv4_4_3x3/bn/scale', 'conv4_4_1x1_increase', 'conv4_4_1x1_increase/bn', 'conv4_4_1x1_increase/bn/scale', 'conv4_4_1x1_down', 'conv4_4_1x1_up', 'conv4_5_1x1_reduce', 'conv4_5_1x1_reduce/bn', 'conv4_5_1x1_reduce/bn/scale', 'conv4_5_3x3', 'conv4_5_3x3/bn', 'conv4_5_3x3/bn/scale', 'conv4_5_1x1_increase', 'conv4_5_1x1_increase/bn', 'conv4_5_1x1_increase/bn/scale', 'conv4_5_1x1_down', 'conv4_5_1x1_up', 'conv4_6_1x1_reduce', 'conv4_6_1x1_reduce/bn', 'conv4_6_1x1_reduce/bn/scale', 'conv4_6_3x3', 'conv4_6_3x3/bn', 'conv4_6_3x3/bn/scale', 'conv4_6_1x1_increase', 'conv4_6_1x1_increase/bn', 'conv4_6_1x1_increase/bn/scale', 'conv4_6_1x1_down', 'conv4_6_1x1_up', 'conv5_1_1x1_reduce', 'conv5_1_1x1_reduce/bn', 'conv5_1_1x1_reduce/bn/scale', 'conv5_1_3x3', 'conv5_1_3x3/bn', 'conv5_1_3x3/bn/scale', 'conv5_1_1x1_increase', 'conv5_1_1x1_increase/bn', 'conv5_1_1x1_increase/bn/scale', 'conv5_1_1x1_down', 'conv5_1_1x1_up', 'conv5_1_1x1_proj', 'conv5_1_1x1_proj/bn', 'conv5_1_1x1_proj/bn/scale', 
'conv5_2_1x1_reduce', 'conv5_2_1x1_reduce/bn', 'conv5_2_1x1_reduce/bn/scale', 'conv5_2_3x3', 'conv5_2_3x3/bn', 'conv5_2_3x3/bn/scale', 'conv5_2_1x1_increase', 'conv5_2_1x1_increase/bn', 'conv5_2_1x1_increase/bn/scale', 'conv5_2_1x1_down', 'conv5_2_1x1_up', 'conv5_3_1x1_reduce', 'conv5_3_1x1_reduce/bn', 'conv5_3_1x1_reduce/bn/scale', 'conv5_3_3x3', 'conv5_3_3x3/bn', 'conv5_3_3x3/bn/scale', 'conv5_3_1x1_increase', 'conv5_3_1x1_increase/bn', 'conv5_3_1x1_increase/bn/scale', 'conv5_3_1x1_down', 'conv5_3_1x1_up', 'classifier'])
+#
+
+# how to copy weights:
+# e.g.
+#   pytorch_state_dict['conv.weight'] = caffe_net_params['conv'][0].data
+#   pytorch_state_dict['conv.bias  '] = caffe_net_params['conv'][1].data
+
+
+
+# main #################################################################
+if __name__ == '__main__':
+    print('%s: calling main function ...' % os.path.basename(__file__))
+    prototxt_file = '/media/rs/3EBAC1C7BAC17BC1/Detections/RON_Tensorflow/traincudnn.prototxt'
+    caffemodel_file = '/media/rs/3EBAC1C7BAC17BC1/Detections/RON_Tensorflow/model/RON320_VOC0712_VOC07.caffemodel'
+    # Load the network on CPU in TEST phase from the two files above.
+    caffe.set_mode_cpu()
+    caffe_net = caffe.Net(prototxt_file, caffemodel_file, caffe.TEST)
+    # Print the keys of the net's parameter dict (see the "caffe keys" note above).
+    caffe_net_params = caffe_net.params
+    print(caffe_net_params.keys())
+
+    sys.exit(0)
+
+
+
+
+
+
+
+
+
@@ -23,12 +23,14 @@
 
 from datasets import pascalvoc_2007
 from datasets import pascalvoc_2012
+from datasets import pascalvoc_2007_2012
 
 datasets_map = {
     'cifar10': cifar10,
     'imagenet': imagenet,
     'pascalvoc_2007': pascalvoc_2007,
     'pascalvoc_2012': pascalvoc_2012,
+    'pascalvoc_0712': pascalvoc_2007_2012
 }
 
 
@@ -52,4 +54,30 @@ def get_dataset(name, split_name, dataset_dir, file_pattern=None, reader=None):
     return datasets_map[name].get_split(split_name,
                                         dataset_dir,
                                         file_pattern,
-                                        reader)
+                                        reader,
+                                        False)
+
+def get_replica_dataset(name, split_name, dataset_dir, num_workers, worker_index, file_pattern=None, reader=None):
+    """Given a dataset name and a split_name returns a Dataset for one replica worker.
+
+    Args:
+        name: String, the name of the dataset.
+        split_name: A train/test split name.
+        dataset_dir: The directory where the dataset files are stored.
+        num_workers, worker_index: Worker count and this worker's index, forwarded to `get_split`.
+        file_pattern: The file pattern to use for matching the dataset source files.
+        reader: The subclass of tf.ReaderBase; `None` uses the default reader of each dataset.
+    Returns:
+        A `Dataset` class.
+    Raises:
+        ValueError: If the dataset `name` is unknown.
+    """
+    if name not in datasets_map:
+        raise ValueError('Name of dataset unknown %s' % name)
+    return datasets_map[name].get_split(split_name,
+                                        dataset_dir,
+                                        file_pattern,
+                                        reader,
+                                        True,
+                                        num_workers = num_workers,
+                                        worker_index = worker_index)
@@ -86,7 +86,7 @@
 NUM_CLASSES = 20
 
 
-def get_split(split_name, dataset_dir, file_pattern=None, reader=None):
+def get_split(split_name, dataset_dir, file_pattern=None, reader=None, replica=False, **kwargs):
     """Gets a dataset tuple with instructions for reading ImageNet.
 
     Args:
@@ -109,4 +109,6 @@ def get_split(split_name, dataset_dir, file_pattern=None, reader=None):
                                       file_pattern, reader,
                                       SPLITS_TO_SIZES,
                                       ITEMS_TO_DESCRIPTIONS,
-                                      NUM_CLASSES)
+                                      NUM_CLASSES,
+                                      replica,
+                                      **kwargs)
@@ -0,0 +1,118 @@
+# Copyright 2015 Paul Balanca. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Provides data for the Pascal VOC Dataset (images + annotations).
+"""
+import tensorflow as tf
+from datasets import pascalvoc_common
+
+slim = tf.contrib.slim
+
+FILE_PATTERN = 'voc_20??_%s_*.tfrecord'
+ITEMS_TO_DESCRIPTIONS = {
+    'image': 'A color image of varying height and width.',
+    'shape': 'Shape of the image',
+    'object/bbox': 'A list of bounding boxes, one per each object.',
+    'object/label': 'A list of labels, one per each object.',
+}
+# (Images, Objects) statistics on every class.
+TRAIN_STATISTICS = {
+    'cow': (444, 847),
+    'car': (1874, 3267),
+    'pottedplant': (772, 1487),
+    'none': (0, 0),
+    'person': (6095, 13256),
+    'bicycle': (795, 1064),
+    'bottle': (950, 1764),
+    'dog': (1707, 2025),
+    'motorbike': (771, 1052),
+    'boat': (689, 1140),
+    'train': (805, 925),
+    'total': (16551, 40058),
+    'diningtable': (738, 824),
+    'sheep': (421, 1070),
+    'bus': (607, 822),
+    'aeroplane': (908, 1171),
+    'sofa': (736, 814),
+    'chair': (1564, 3152),
+    'tvmonitor': (831, 1108),
+    'horse': (769, 1072),
+    'cat': (1417, 1593),
+    'bird': (1095, 1605)
+}
+
+TEST_STATISTICS = {
+    'none': (0, 0),
+    'aeroplane': (1, 1),
+    'bicycle': (1, 1),
+    'bird': (1, 1),
+    'boat': (1, 1),
+    'bottle': (1, 1),
+    'bus': (1, 1),
+    'car': (1, 1),
+    'cat': (1, 1),
+    'chair': (1, 1),
+    'cow': (1, 1),
+    'diningtable': (1, 1),
+    'dog': (1, 1),
+    'horse': (1, 1),
+    'motorbike': (1, 1),
+    'person': (1, 1),
+    'pottedplant': (1, 1),
+    'sheep': (1, 1),
+    'sofa': (1, 1),
+    'train': (1, 1),
+    'tvmonitor': (1, 1),
+    'total': (20, 20),
+}
+SPLITS_TO_SIZES = {
+    'train': 22136,
+    'test': 4952,
+}
+SPLITS_TO_STATISTICS = {
+    'train': TRAIN_STATISTICS,
+    'test': TEST_STATISTICS,
+}
+NUM_CLASSES = 20
+
+
+def get_split(split_name, dataset_dir, file_pattern=None, reader=None, replica=False, **kwargs):
+    """Gets a dataset tuple with instructions for reading the Pascal VOC dataset.
+
+    Args:
+      split_name: A train/test split name.
+      dataset_dir: The base directory of the dataset sources.
+      file_pattern: The file pattern to use when matching the dataset sources; assumed
+        to contain a '%s' for the split name. Falls back to FILE_PATTERN when falsy.
+      reader: The TensorFlow reader type.
+      replica, **kwargs: Forwarded unchanged to `pascalvoc_common.get_split`.
+
+    Returns:
+      A `Dataset` namedtuple.
+
+    Raises:
+        ValueError: if `split_name` is not a valid train/test split.
+    """
+    if not file_pattern:
+        file_pattern = FILE_PATTERN
+    return pascalvoc_common.get_split(split_name, dataset_dir,
+                                      file_pattern, reader,
+                                      SPLITS_TO_SIZES,
+                                      ITEMS_TO_DESCRIPTIONS,
+                                      NUM_CLASSES,
+                                      replica,
+                                      **kwargs)
+
+# for k, v in TRAIN_STATISTICS2.items():
+#     print("'{}': ({}, {})".format(k ,v[0]+TRAIN_STATISTICS1[k][0],v[1]+TRAIN_STATISTICS1[k][1]))
@@ -60,7 +60,7 @@
 NUM_CLASSES = 20
 
 
-def get_split(split_name, dataset_dir, file_pattern=None, reader=None):
+def get_split(split_name, dataset_dir, file_pattern=None, reader=None, replica=False, **kwargs):
     """Gets a dataset tuple with instructions for reading ImageNet.
 
     Args:
@@ -80,8 +80,10 @@ def get_split(split_name, dataset_dir, file_pattern=None, reader=None):
     if not file_pattern:
         file_pattern = FILE_PATTERN
     return pascalvoc_common.get_split(split_name, dataset_dir,
-                                      file_pattern, reader,
-                                      SPLITS_TO_SIZES,
-                                      ITEMS_TO_DESCRIPTIONS,
-                                      NUM_CLASSES)
+                                        file_pattern, reader,
+                                        SPLITS_TO_SIZES,
+                                        ITEMS_TO_DESCRIPTIONS,
+                                        NUM_CLASSES,
+                                        replica,
+                                        **kwargs)
 
@@ -45,9 +45,15 @@
     'tvmonitor': (20, 'Indoor'),
 }
 
+VOC_CLASSES = (  # no background entry; NOTE(review): labels look 1-based ('tvmonitor': 20), so index = label - 1 — confirm
+    'aeroplane', 'bicycle', 'bird', 'boat',
+    'bottle', 'bus', 'car', 'cat', 'chair',
+    'cow', 'diningtable', 'dog', 'horse',
+    'motorbike', 'person', 'pottedplant',
+    'sheep', 'sofa', 'train', 'tvmonitor')
 
 def get_split(split_name, dataset_dir, file_pattern, reader,
-              split_to_sizes, items_to_descriptions, num_classes):
+              split_to_sizes, items_to_descriptions, num_classes, replica, **kwargs):
     """Gets a dataset tuple with instructions for reading Pascal VOC dataset.
 
     Args:
@@ -66,7 +72,22 @@ def get_split(split_name, dataset_dir, file_pattern, reader,
     """
     if split_name not in split_to_sizes:
         raise ValueError('split name %s was not recognized.' % split_name)
-    file_pattern = os.path.join(dataset_dir, file_pattern % split_name)
+
+    if replica:
+        if 'num_workers' not in kwargs:
+            raise ValueError('Must provide "num_workers" for slim DatasetDataProvider.')
+        if 'worker_index' not in kwargs:
+            raise ValueError('Must provide "worker_index" for slim DatasetDataProvider.')
+        if not (kwargs['worker_index'] < kwargs['num_workers']):
+            raise ValueError('"worker_index" must in the range [0, num_workers].')
+        input_file_list = tf.gfile.Glob(os.path.join(dataset_dir, file_pattern % split_name))
+
+        slice_start = int(kwargs['worker_index']*len(input_file_list)/kwargs['num_workers'])
+        slice_end = int((kwargs['worker_index']+1)*len(input_file_list)/kwargs['num_workers'])
+        input_file_list.sort()
+        file_pattern = input_file_list[slice_start:slice_end]
+    else:
+        file_pattern = os.path.join(dataset_dir, file_pattern % split_name)
 
     # Allowing None in the signature so that dataset_factory can use the default.
     if reader is None: