From c0211deb41967a28ceff77ce6ef4de7c5da3ed2e Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Thu, 30 Nov 2017 22:41:15 +0800 Subject: [PATCH 01/53] 1.Enable the conv/eltwise/relu fusion; 2.Add the -DENABLE_CONV_SUM_FUSION option to enable this feature. Change-Id: Ia9a64ade38de0afb2f1abcc0f7855c8b2f8e2170 --- Makefile | 5 ++ Makefile.config.example | 5 +- cmake/Misc.cmake | 6 ++ include/caffe/layers/base_conv_layer.hpp | 3 +- include/caffe/net.hpp | 7 +- src/caffe/layers/base_conv_layer.cpp | 2 + src/caffe/layers/mkldnn_convolution_layer.cpp | 26 ++++++- src/caffe/net.cpp | 73 +++++++++++++++++++ 8 files changed, 120 insertions(+), 7 deletions(-) diff --git a/Makefile b/Makefile index 22575b4b1..10a10a1d9 100644 --- a/Makefile +++ b/Makefile @@ -492,6 +492,11 @@ ifeq ($(DISABLE_BN_FOLDING), 1) COMMON_FLAGS += -DDISABLE_BN_FOLDING endif +# Disable the conv/eltwise/relu layer fusion +ifeq ($(DISABLE_CONV_SUM_FUSION), 1) + COMMON_FLAGS += -DDISABLE_CONV_SUM_FUSION +endif + # Performance monitoring ifeq ($(PERFORMANCE_MONITORING), 1) CXXFLAGS += -DPERFORMANCE_MONITORING diff --git a/Makefile.config.example b/Makefile.config.example index b552ca458..f157f34f7 100644 --- a/Makefile.config.example +++ b/Makefile.config.example @@ -76,8 +76,11 @@ USE_MKLDNN_AS_DEFAULT_ENGINE := 1 # already. # BOOST_ROOT := -# Use remove batch norm optimization to boost inferrence +# Use remove batch norm optimization to boost inference DISABLE_BN_FOLDING := 0 + +#Use conv/eltwise/relu layer fusion to boost inference. 
+ENABLE_CONV_SUM_FUSION := 0 # Intel(r) Machine Learning Scaling Library (uncomment to build # with MLSL for multi-node training) # USE_MLSL :=1 diff --git a/cmake/Misc.cmake b/cmake/Misc.cmake index 0657ee1e9..70171ce96 100644 --- a/cmake/Misc.cmake +++ b/cmake/Misc.cmake @@ -10,6 +10,12 @@ if(DISABLE_BN_FOLDING) message(STATUS "Bn folding is disabled!") add_definitions("-DDISABLE_BN_FOLDING") endif() + +if(ENABLE_CONV_SUM_FUSION) + message(STATUS "conv/eltwise/relu fusion is disabled!") + add_definitions("-DENABLE_CONV_SUM_FUSION") +endif() + # --[ If user doesn't specify build type then assume release if("${CMAKE_BUILD_TYPE}" STREQUAL "") set(CMAKE_BUILD_TYPE Release) diff --git a/include/caffe/layers/base_conv_layer.hpp b/include/caffe/layers/base_conv_layer.hpp index 00a819920..5dd5ca48b 100755 --- a/include/caffe/layers/base_conv_layer.hpp +++ b/include/caffe/layers/base_conv_layer.hpp @@ -63,8 +63,9 @@ class BaseConvolutionLayer : public Layer { virtual inline int MinBottomBlobs() const { return 1; } virtual inline int MinTopBlobs() const { return 1; } +#ifndef ENABLE_CONV_SUM_FUSION virtual inline bool EqualNumBottomTopBlobs() const { return true; } - +#endif protected: // Split Reshape into two parts // Part 1 for normal blob reshape diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index c8e274c6d..71cce7b73 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -304,7 +304,12 @@ class Net { static void CompilationRuleThree(const NetParameter& param, NetParameter* param_compiled); - + /** + * @brief This is rule analyze for conv/elt/relu fusion. + */ + static void CompilationRuleFour(const NetParameter& param, + NetParameter* param_compiled); + /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. 
diff --git a/src/caffe/layers/base_conv_layer.cpp b/src/caffe/layers/base_conv_layer.cpp index 205be870c..9f967b43d 100644 --- a/src/caffe/layers/base_conv_layer.cpp +++ b/src/caffe/layers/base_conv_layer.cpp @@ -232,11 +232,13 @@ void BaseConvolutionLayer::DoReshape(const vector*>& bottom, num_ = bottom[0]->count(0, channel_axis_); CHECK_EQ(bottom[0]->shape(channel_axis_), channels_) << "Input size incompatible with convolution kernel."; +#ifndef ENABLE_CONV_SUM_FUSION // TODO: generalize to handle inputs of different shapes. for (int bottom_id = 1; bottom_id < bottom.size(); ++bottom_id) { CHECK(bottom[0]->shape() == bottom[bottom_id]->shape()) << "All inputs must have the same shape."; } +#endif // Shape the tops. bottom_shape_ = &bottom[0]->shape(); compute_output_shape(); diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index 6d0778adb..4244f7f2f 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -145,6 +145,12 @@ void MKLDNNConvolutionLayer::Reshape(const vector*>& bottom this->num_ == bottom[0]->num()) ? false : true; init_properties(bottom, top); BaseConvolutionLayer::ReshapeForMKL(bottom, top); + +#ifdef ENABLE_CONV_SUM_FUSION + if (bottom.size() > 1) { + top[0]->ShareData(*bottom[1]); + } +#endif } template @@ -203,11 +209,20 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* convFwd_pd = NULL; mkldnn::primitive_attr attr; mkldnn::post_ops ops; - + +#ifdef ENABLE_CONV_SUM_FUSION + if(relu || bottom.size() > 1) { +#else if(relu) { +#endif float scale = 1.0f; //for fp32, scale is 1. Dtype alpha = negative_slope; // negative slope for mkldnn_eltwise_relu. float beta = 1.0f; //ignored for mkldnn_eltwise_relu. 
+#ifdef ENABLE_CONV_SUM_FUSION + if (bottom.size() > 1) { + ops.append_sum(1.0f); + } +#endif ops.append_eltwise(scale, eltwise_relu, alpha, beta); attr.set_post_ops(ops); } @@ -230,10 +245,13 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* for (subEngineIndex = 0; subEngineIndex < ep.getNumberOfSubEngines(); subEngineIndex++) { try { - if (relu) { - convFwd_pd.reset(new convolution_forward::primitive_desc( +#ifdef ENABLE_CONV_SUM_FUSION + if(relu || bottom.size() > 1) { +#else + if(relu) { +#endif + convFwd_pd.reset(new convolution_forward::primitive_desc( *convFwd_desc, attr, ep.getMKLDNNSubEngine(subEngineIndex))); - } else { convFwd_pd.reset(new convolution_forward::primitive_desc( *convFwd_desc, ep.getMKLDNNSubEngine(subEngineIndex))); diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 0afc6d31f..4a9a9621a 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -529,9 +529,20 @@ void Net::CompileNet(const NetParameter& param, param_temp2.clear_layer(); // Remove layers CompilationRuleTwo(param_temp, ¶m_temp2); +#ifndef ENABLE_CONV_SUM_FUSION param_compiled->CopyFrom(param_temp2); param_compiled->clear_layer(); // Remove layers CompilationRuleThree(param_temp2, param_compiled); +#else + NetParameter param_temp3; + param_temp3.CopyFrom(param_temp2); + param_temp3.clear_layer(); + CompilationRuleThree(param_temp2, ¶m_temp3); + + param_compiled->CopyFrom(param_temp3); + param_compiled->clear_layer(); + CompilationRuleFour(param_temp3, param_compiled); +#endif } template @@ -832,6 +843,68 @@ void Net::CompilationRuleThree(const NetParameter& param, return; } +template +void Net::CompilationRuleFour(const NetParameter& param, + NetParameter* param_compiled) { + // only apply this rule for inference(TEST) phase + if (param.state().phase() != TEST) { + param_compiled->CopyFrom(param); + return; + } + string blob_need_to_insert; + LayerParameter* need_to_convert_layer = NULL; + for (int i = 0; i < param.layer_size(); i++) { + LayerParameter* 
layer_param = + (const_cast(param)).mutable_layer(i); + if (layer_param->type().compare("Convolution") == 0) { + std::vector child_layers_params; + Net::GetBlobConsumers(child_layers_params, layer_param->top(0), + param, + i + 1 < param.layer_size() ? i + 1 : i); + + if (child_layers_params[0]->type().compare("Eltwise") == 0) { + std::vector grand_child_layers_params; + + Net::GetBlobConsumers(grand_child_layers_params, + child_layers_params[0]->top(0), param, + i + 1 < param.layer_size() ? i + 1 : i); + const LayerParameter& grand_child_layer_param = + grand_child_layers_params.size() > 0 + ? *(grand_child_layers_params[0]) + : *layer_param; + + if (grand_child_layer_param.type().compare("ReLU") != 0) { + param_compiled->add_layer()->CopyFrom(*layer_param); + continue; + } + + if (child_layers_params[0]->bottom(0) == layer_param->top(0) ) { + param_compiled->add_layer()->CopyFrom(*layer_param); + need_to_convert_layer = layer_param; + continue; + } + + const_cast(layer_param->top(0)) = + grand_child_layer_param.top(0); + if (need_to_convert_layer != NULL) { + layer_param->add_bottom( + const_cast(need_to_convert_layer->top(0))); + need_to_convert_layer = NULL; + } else { + layer_param->add_bottom( + const_cast(child_layers_params[0]->bottom(0))); + } + + i += 2; // skip next eltwise and relu + } + } + + param_compiled->add_layer()->CopyFrom(*layer_param); + } + + return; +} + template void Net::GetBlobConsumers( std::vector& consumer_blobs, From b8b4ed04eb423e5f7096abe3de05051347956128 Mon Sep 17 00:00:00 2001 From: Haihao Shen Date: Fri, 1 Dec 2017 14:24:51 +0800 Subject: [PATCH 02/53] Enable winograd when kernel size is 3x3, stride is unit, and output is 16 dividable --- examples/pycaffe/tune_model.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/examples/pycaffe/tune_model.py b/examples/pycaffe/tune_model.py index 628adf9c0..cf2bd6334 100644 --- a/examples/pycaffe/tune_model.py +++ b/examples/pycaffe/tune_model.py @@ -10,7 +10,13 @@ 
def genOptimalModel(net, mkldnn_direct_time_map, mkldnn_winograd_time_map, optim for index in range(0, len(net.layer)): l = net.layer[index] if l.type == "Convolution": - if mkldnn_winograd_time_map[l.name] < mkldnn_direct_time_map[l.name]: + if len(l.convolution_param.kernel_size) == 0: + continue + kernel_size = l.convolution_param.kernel_size[0] + stride = 1 + if len(l.convolution_param.stride) != 0: + stride = l.convolution_param.stride[0] + if mkldnn_winograd_time_map[l.name] < mkldnn_direct_time_map[l.name] and kernel_size == 3 and stride == 1 and l.convolution_param.num_output % 16 ==0: l.convolution_param.conv_algorithm = "winograd" else: l.convolution_param.conv_algorithm = "direct" From 8e61bbed143af1a5776d66d37d173924935c92db Mon Sep 17 00:00:00 2001 From: fzou1 Date: Mon, 4 Dec 2017 16:43:01 +0800 Subject: [PATCH 03/53] support collecting single node performance to do apple-to-apple comparision with multinode --- include/caffe/net.hpp | 56 ++++++++++++++++++++++++++ include/caffe/solver.hpp | 1 + src/caffe/multinode/multi_solver.cpp | 59 +++------------------------- src/caffe/net.cpp | 10 +++++ src/caffe/solver.cpp | 9 ++--- src/caffe/solvers/sgd_solver.cpp | 34 ++++++++++++++++ 6 files changed, 110 insertions(+), 59 deletions(-) diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index 71cce7b73..8438bfa06 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -51,6 +51,55 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
namespace caffe { +#ifdef CAFFE_PER_LAYER_TIMINGS + template class Solver; + +#define LAYER_TIMING_START() do { \ + root_solver_->timer.Start(); \ +}while(0) + +#define LAYER_TIMING_STOP(name, index) do { \ + root_solver_->name##_time_per_layer[index] += root_solver_->timer.MicroSeconds(); \ +}while(0) + +#ifdef FW_OVERLAP_OPT +#define LAYER_WAIT_TIMING_START() do { \ + root_solver_->wait_timer.Start(); \ +}while(0) + +#define LAYER_WAIT_TIMING_STOP(layer_index) do { \ + root_solver_->waitcomm_time_per_layer[layer_index] += root_solver_->wait_timer.MicroSeconds(); \ +}while(0) + +#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) do { \ + root_solver_->waitcomm_time_per_layer[layer_i] -= root_solver_->update_time_per_layer[layer_k]; \ +} while (0) +#endif + +#define ITER_TIMING_START() do { \ + root_solver_->timer.Start(); \ +}while(0) + +#define ITER_TIMING_STOP(name) do { \ + root_solver_->name##_time_per_iter += root_solver_->timer.MicroSeconds(); \ +}while(0) + +#else + +#define LAYER_TIMING_START() +#define LAYER_TIMING_STOP(name,index) + +#ifdef FW_OVERLAP_OPT +#define LAYER_WAIT_TIMING_START() +#define LAYER_WAIT_TIMING_STOP(index) +#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) +#endif + +#define ITER_TIMING_START() +#define ITER_TIMING_STOP(name) + +#endif /* CAFFE_PER_LAYER_TIMINGS */ + /** * @brief Connects Layer%s together into a directed acyclic graph (DAG) * specified by a NetParameter. 
@@ -336,6 +385,9 @@ class Net { /// @brief return whether NetState state meets NetStateRule rule static bool StateMeetsRule(const NetState& state, const NetStateRule& rule, const string& layer_name); +#ifdef CAFFE_PER_LAYER_TIMINGS + void set_root_solver(Solver * solver) { root_solver_ = solver; } +#endif inline const map& blob_names_index() const { return blob_names_index_; } @@ -425,6 +477,10 @@ class Net { /// The root net that actually holds the shared layers in data parallelism const Net* const root_net_; DISABLE_COPY_AND_ASSIGN(Net); + +#ifdef CAFFE_PER_LAYER_TIMINGS + Solver * root_solver_; +#endif }; diff --git a/include/caffe/solver.hpp b/include/caffe/solver.hpp index 5b48287b9..71489fbb8 100644 --- a/include/caffe/solver.hpp +++ b/include/caffe/solver.hpp @@ -189,6 +189,7 @@ class Solver { void InitTimers(); void ResetTimers(); void PrintTimers(bool printTotal); + #endif /* CAFFE_PER_LAYER_TIMINGS */ protected: diff --git a/src/caffe/multinode/multi_solver.cpp b/src/caffe/multinode/multi_solver.cpp index 4f3df7838..2887d1a43 100644 --- a/src/caffe/multinode/multi_solver.cpp +++ b/src/caffe/multinode/multi_solver.cpp @@ -46,53 +46,6 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
namespace caffe { -#ifdef CAFFE_PER_LAYER_TIMINGS - -#define LAYER_TIMING_START() do { \ - root_solver_->timer.Start(); \ -}while(0) - -#define LAYER_TIMING_STOP(name, index) do { \ - root_solver_->name##_time_per_layer[index] += root_solver_->timer.MicroSeconds(); \ -}while(0) - -#ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() do { \ - root_solver_->wait_timer.Start(); \ -}while(0) - -#define LAYER_WAIT_TIMING_STOP(layer_index) do { \ - root_solver_->waitcomm_time_per_layer[layer_index] += root_solver_->wait_timer.MicroSeconds(); \ -}while(0) - -#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) do { \ - root_solver_->waitcomm_time_per_layer[layer_i] -= root_solver_->update_time_per_layer[layer_k]; \ -} while (0) -#endif - -#define ITER_TIMING_START() do { \ - root_solver_->timer.Start(); \ -}while(0) - -#define ITER_TIMING_STOP(name) do { \ - root_solver_->name##_time_per_iter += root_solver_->timer.MicroSeconds(); \ -}while(0) - -#else - -#define LAYER_TIMING_START() -#define LAYER_TIMING_STOP(name,index) - -#ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() -#define LAYER_WAIT_TIMING_STOP(layer_index) -#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) -#endif - -#define ITER_TIMING_START() -#define ITER_TIMING_STOP(name) - -#endif template inline bool MultiSolver::IsSkipWaitGradient(int layer_id) { @@ -117,6 +70,7 @@ inline bool MultiSolver::WaitGradient(int layer_id) { for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->on_delwt_wait(layer_id); } + #ifndef FW_OVERLAP_OPT LAYER_TIMING_STOP(waitcomm, layer_id); return true; @@ -130,11 +84,13 @@ inline void MultiSolver::UpdateGradient(int layer_id) { #ifdef FW_OVERLAP_OPT if (layer_finished_flags_[layer_id]) { #endif + LAYER_TIMING_START(); for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->apply_updates(layer_id); } LAYER_TIMING_STOP(update, layer_id); + #ifdef FW_OVERLAP_OPT } #endif @@ -188,30 +144,25 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, bool last) { } #endif 
- LAYER_TIMING_START(); loss += net.ForwardFromTo(i, i); - LAYER_TIMING_STOP(forward, i); } // Clear parameter diffs after communication is finished (that is, after // calling WaitGradientComm) if (first) { - ITER_TIMING_START(); root_solver_->net()->ClearParamDiffs(); - ITER_TIMING_STOP(cleardiffs); } for (int i = layers.size() - 1; i >= 0; --i) { if (!layer_need_backward[i]) { continue; } - - LAYER_TIMING_START(); + net.BackwardFromTo(i, i); - LAYER_TIMING_STOP(backward, i); if (last && (layers[i]->layerOp != nullptr) && layers[i]->layerOp->HasParameterSets()) { + LAYER_TIMING_START(); for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->on_backward_finished(i); diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 4a9a9621a..fa8a03b13 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -64,6 +64,10 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "caffe/util/remove_batch_norm.hpp" #include "caffe/util/apply_bn_stats_batch_size.hpp" +#ifdef CAFFE_PER_LAYER_TIMINGS +#include "caffe/solver.hpp" +#endif + PERFORMANCE_CREATE_MONITOR(); namespace caffe { @@ -1230,12 +1234,14 @@ Dtype Net::ForwardFromTo(int start, int end) { CHECK_LT(end, layers_.size()); Dtype loss = 0; for (int i = start; i <= end; ++i) { + LAYER_TIMING_START(); PERFORMANCE_MEASUREMENT_BEGIN(); // LOG(ERROR) << "Forwarding " << layer_names_[i]; Dtype layer_loss = layers_[i]->Forward(bottom_vecs_[i], top_vecs_[i]); PERFORMANCE_MEASUREMENT_END((std::string("FW_") + layer_names_[i]).c_str()); + LAYER_TIMING_STOP(forward, i); loss += layer_loss; if (debug_info_) { ForwardDebugInfo(i); } @@ -1281,12 +1287,14 @@ void Net::BackwardFromTo(int start, int end) { CHECK_LT(start, layers_.size()); for (int i = start; i >= end; --i) { if (layer_need_backward_[i]) { + LAYER_TIMING_START(); PERFORMANCE_MEASUREMENT_BEGIN(); layers_[i]->Backward( top_vecs_[i], bottom_need_backward_[i], bottom_vecs_[i]); 
PERFORMANCE_MEASUREMENT_END((std::string("BW_")+layer_names_[i]).c_str()); + LAYER_TIMING_STOP(backward, i); if (debug_info_) { BackwardDebugInfo(i); } } @@ -1794,9 +1802,11 @@ void Net::ClearParamDiffs(int learnable_param_id) { template void Net::ClearParamDiffs() { + ITER_TIMING_START(); for (int i = 0; i < learnable_params_.size(); ++i) { ClearParamDiffs(i); } + ITER_TIMING_STOP(cleardiffs); } template diff --git a/src/caffe/solver.cpp b/src/caffe/solver.cpp index 781aca9d7..f566ce935 100644 --- a/src/caffe/solver.cpp +++ b/src/caffe/solver.cpp @@ -125,6 +125,7 @@ void Solver::Init(const SolverParameter& param) { #ifdef CAFFE_PER_LAYER_TIMINGS InitTimers(); + net_->set_root_solver(this); #endif } @@ -340,11 +341,6 @@ void Solver::Step(int iters) { } } -#ifdef CAFFE_PER_LAYER_TIMINGS - PrintTimers(false); - ResetTimers(); -#endif - iter_timer.Start(); for (int i = 0; i < callbacks_.size(); ++i) { @@ -361,6 +357,9 @@ void Solver::Step(int iters) { iter_time += iter_timer.MilliSeconds(); #ifdef CAFFE_PER_LAYER_TIMINGS + PrintTimers(false); + ResetTimers(); + if (mn::get_node_id() == 0) LOG(INFO) << "iter " << iter_ << ", forward_backward_update_time: " << iter_time << " ms"; diff --git a/src/caffe/solvers/sgd_solver.cpp b/src/caffe/solvers/sgd_solver.cpp index c700eeb85..dbd916dd9 100644 --- a/src/caffe/solvers/sgd_solver.cpp +++ b/src/caffe/solvers/sgd_solver.cpp @@ -45,6 +45,26 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
namespace caffe { + +#ifdef CAFFE_PER_LAYER_TIMINGS + +#define LAYER_UPDATE_TIMING_START() do { \ + this->timer.Start(); \ +}while(0) + +#define LAYER_UPDATE_TIMING_STOP(index) do { \ + this->update_time_per_layer[index] += this->timer.MicroSeconds(); \ +}while(0) + +#else + +#define LAYER_UPDATE_TIMING_START() +#define LAYER_UPDATE_TIMING_STOP(index) + +#endif + + + template Dtype SGDSolver::GetWarmUpLR(int cur_iter, int warmup_iter, Dtype warmup_start_lr) { if (cur_iter < 0) { @@ -195,10 +215,24 @@ template void SGDSolver::ApplyUpdate() { PrintLearningRate(); ClipGradients(); +#ifdef CAFFE_PER_LAYER_TIMINGS +#ifdef USE_MLSL + CHECK(mn::is_multinode() == false); +#endif + for (int i=0; inet_->layers().size(); i++) { + const std::vector param_ids = this->net_->get_layer_learnable_param_ids(i); + LAYER_UPDATE_TIMING_START(); + for (int param_id = 0; param_id < param_ids.size(); ++param_id) { + ApplyUpdate(param_ids[param_id]); + } + LAYER_UPDATE_TIMING_STOP(i); + } +#else for (int param_id = 0; param_id < this->net_->learnable_params().size(); ++param_id) { ApplyUpdate(param_id); } +#endif } template From f63182141cb88f61435aed6d21e68cc05df78b6b Mon Sep 17 00:00:00 2001 From: linxinan Date: Wed, 6 Dec 2017 10:13:02 +0800 Subject: [PATCH 04/53] add googlenet_v1 1k batch prototxts --- .../solver.prototxt | 19 + .../train_val.prototxt | 2434 +++++++++++++++++ 2 files changed, 2453 insertions(+) create mode 100755 models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/solver.prototxt create mode 100755 models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/train_val.prototxt diff --git a/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/solver.prototxt b/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/solver.prototxt new file mode 100755 index 000000000..a729fdacd --- /dev/null +++ b/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/solver.prototxt @@ -0,0 +1,19 @@ +#test accuracy / target 
accuracy +#Top-5: 0.887741 / 0.89 +#Top-1: 0.683879 / 0.687 +#Training was performed using server equipped with Intel(R) Xeon Phi(TM) CPU 7250 processor. +net: "models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/train_val.prototxt" +test_iter: 1000 +test_interval: 2000 +test_initialization: false +display: 40 +average_loss: 40 +base_lr: 0.065 +lr_policy: "poly" +power: 0.5 +max_iter: 90000 +momentum: 0.9 +weight_decay: 0.0002 +snapshot: 10000 +snapshot_prefix: "models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/snapshots/googlenet" +solver_mode: CPU diff --git a/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/train_val.prototxt b/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/train_val.prototxt new file mode 100755 index 000000000..04f505ee1 --- /dev/null +++ b/models/intel_optimized_models/multinode/googlenet_16nodes_1k_batch/train_val.prototxt @@ -0,0 +1,2434 @@ +name: "GoogleNet" +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TRAIN + } + transform_param { + mirror: true + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 123 + } + data_param { +source: "examples/imagenet/ilsvrc12_train_lmdb" + batch_size: 64 + backend: LMDB + shuffle: true + } +} +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TEST + } + transform_param { + mirror: false + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 123 + } + data_param { +source: "examples/imagenet/ilsvrc12_val_lmdb" + batch_size: 50 + backend: LMDB + } +} +layer { + name: "conv1/7x7_s2" + type: "Convolution" + bottom: "data" + top: "conv1/7x7_s2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 3 + kernel_size: 7 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv1/relu_7x7" + 
type: "ReLU" + bottom: "conv1/7x7_s2" + top: "conv1/7x7_s2" +} +layer { + name: "pool1/3x3_s2" + type: "Pooling" + bottom: "conv1/7x7_s2" + top: "pool1/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "pool1/norm1" + type: "LRN" + bottom: "pool1/3x3_s2" + top: "pool1/norm1" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "conv2/3x3_reduce" + type: "Convolution" + bottom: "pool1/norm1" + top: "conv2/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv2/relu_3x3_reduce" + type: "ReLU" + bottom: "conv2/3x3_reduce" + top: "conv2/3x3_reduce" +} +layer { + name: "conv2/3x3" + type: "Convolution" + bottom: "conv2/3x3_reduce" + top: "conv2/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv2/relu_3x3" + type: "ReLU" + bottom: "conv2/3x3" + top: "conv2/3x3" +} +layer { + name: "conv2/norm2" + type: "LRN" + bottom: "conv2/3x3" + top: "conv2/norm2" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "pool2/3x3_s2" + type: "Pooling" + bottom: "conv2/norm2" + top: "pool2/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_3a/1x1" + type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_1x1" + 
type: "ReLU" + bottom: "inception_3a/1x1" + top: "inception_3a/1x1" +} +layer { + name: "inception_3a/3x3_reduce" + type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_3a/3x3_reduce" + top: "inception_3a/3x3_reduce" +} +layer { + name: "inception_3a/3x3" + type: "Convolution" + bottom: "inception_3a/3x3_reduce" + top: "inception_3a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_3x3" + type: "ReLU" + bottom: "inception_3a/3x3" + top: "inception_3a/3x3" +} +layer { + name: "inception_3a/5x5_reduce" + type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_3a/5x5_reduce" + top: "inception_3a/5x5_reduce" +} +layer { + name: "inception_3a/5x5" + type: "Convolution" + bottom: "inception_3a/5x5_reduce" + top: "inception_3a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_5x5" + type: "ReLU" + bottom: 
"inception_3a/5x5" + top: "inception_3a/5x5" +} +layer { + name: "inception_3a/pool" + type: "Pooling" + bottom: "pool2/3x3_s2" + top: "inception_3a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_3a/pool_proj" + type: "Convolution" + bottom: "inception_3a/pool" + top: "inception_3a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_pool_proj" + type: "ReLU" + bottom: "inception_3a/pool_proj" + top: "inception_3a/pool_proj" +} +layer { + name: "inception_3a/output" + type: "Concat" + bottom: "inception_3a/1x1" + bottom: "inception_3a/3x3" + bottom: "inception_3a/5x5" + bottom: "inception_3a/pool_proj" + top: "inception_3a/output" +} +layer { + name: "inception_3b/1x1" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_1x1" + type: "ReLU" + bottom: "inception_3b/1x1" + top: "inception_3b/1x1" +} +layer { + name: "inception_3b/3x3_reduce" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_3b/3x3_reduce" + top: "inception_3b/3x3_reduce" +} +layer { + name: "inception_3b/3x3" + type: "Convolution" + bottom: 
"inception_3b/3x3_reduce" + top: "inception_3b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_3x3" + type: "ReLU" + bottom: "inception_3b/3x3" + top: "inception_3b/3x3" +} +layer { + name: "inception_3b/5x5_reduce" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_3b/5x5_reduce" + top: "inception_3b/5x5_reduce" +} +layer { + name: "inception_3b/5x5" + type: "Convolution" + bottom: "inception_3b/5x5_reduce" + top: "inception_3b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_5x5" + type: "ReLU" + bottom: "inception_3b/5x5" + top: "inception_3b/5x5" +} +layer { + name: "inception_3b/pool" + type: "Pooling" + bottom: "inception_3a/output" + top: "inception_3b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_3b/pool_proj" + type: "Convolution" + bottom: "inception_3b/pool" + top: "inception_3b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: 
"inception_3b/relu_pool_proj" + type: "ReLU" + bottom: "inception_3b/pool_proj" + top: "inception_3b/pool_proj" +} +layer { + name: "inception_3b/output" + type: "Concat" + bottom: "inception_3b/1x1" + bottom: "inception_3b/3x3" + bottom: "inception_3b/5x5" + bottom: "inception_3b/pool_proj" + top: "inception_3b/output" +} +layer { + name: "pool3/3x3_s2" + type: "Pooling" + bottom: "inception_3b/output" + top: "pool3/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_4a/1x1" + type: "Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_1x1" + type: "ReLU" + bottom: "inception_4a/1x1" + top: "inception_4a/1x1" +} +layer { + name: "inception_4a/3x3_reduce" + type: "Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4a/3x3_reduce" + top: "inception_4a/3x3_reduce" +} +layer { + name: "inception_4a/3x3" + type: "Convolution" + bottom: "inception_4a/3x3_reduce" + top: "inception_4a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 208 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_3x3" + type: "ReLU" + bottom: "inception_4a/3x3" + top: "inception_4a/3x3" +} +layer { + name: "inception_4a/5x5_reduce" + type: 
"Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4a/5x5_reduce" + top: "inception_4a/5x5_reduce" +} +layer { + name: "inception_4a/5x5" + type: "Convolution" + bottom: "inception_4a/5x5_reduce" + top: "inception_4a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 48 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_5x5" + type: "ReLU" + bottom: "inception_4a/5x5" + top: "inception_4a/5x5" +} +layer { + name: "inception_4a/pool" + type: "Pooling" + bottom: "pool3/3x3_s2" + top: "inception_4a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4a/pool_proj" + type: "Convolution" + bottom: "inception_4a/pool" + top: "inception_4a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_pool_proj" + type: "ReLU" + bottom: "inception_4a/pool_proj" + top: "inception_4a/pool_proj" +} +layer { + name: "inception_4a/output" + type: "Concat" + bottom: "inception_4a/1x1" + bottom: "inception_4a/3x3" + bottom: "inception_4a/5x5" + bottom: "inception_4a/pool_proj" + top: "inception_4a/output" +} +layer { + name: "loss1/ave_pool" + type: "Pooling" + bottom: "inception_4a/output" + top: "loss1/ave_pool" + pooling_param { + pool: AVE + kernel_size: 5 + stride: 3 + } +} 
+layer { + name: "loss1/conv" + type: "Convolution" + bottom: "loss1/ave_pool" + top: "loss1/conv" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss1/relu_conv" + type: "ReLU" + bottom: "loss1/conv" + top: "loss1/conv" +} +layer { + name: "loss1/fc" + type: "InnerProduct" + bottom: "loss1/conv" + top: "loss1/fc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss1/relu_fc" + type: "ReLU" + bottom: "loss1/fc" + top: "loss1/fc" +} +layer { + name: "loss1/drop_fc" + type: "Dropout" + bottom: "loss1/fc" + top: "loss1/fc" + dropout_param { + dropout_ratio: 0.7 + } +} +layer { + name: "loss1/classifier" + type: "InnerProduct" + bottom: "loss1/fc" + top: "loss1/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss1/loss" + type: "SoftmaxWithLoss" + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/loss1" + loss_weight: 0.3 +} +layer { + name: "loss1/top-1" + type: "Accuracy" + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/top-1" + include { + phase: TEST + } +} +layer { + name: "loss1/top-5" + type: "Accuracy" + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} +layer { + name: "inception_4b/1x1" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + 
convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_1x1" + type: "ReLU" + bottom: "inception_4b/1x1" + top: "inception_4b/1x1" +} +layer { + name: "inception_4b/3x3_reduce" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 112 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4b/3x3_reduce" + top: "inception_4b/3x3_reduce" +} +layer { + name: "inception_4b/3x3" + type: "Convolution" + bottom: "inception_4b/3x3_reduce" + top: "inception_4b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 224 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_3x3" + type: "ReLU" + bottom: "inception_4b/3x3" + top: "inception_4b/3x3" +} +layer { + name: "inception_4b/5x5_reduce" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4b/5x5_reduce" + top: "inception_4b/5x5_reduce" +} +layer { + name: "inception_4b/5x5" + type: "Convolution" + bottom: "inception_4b/5x5_reduce" + top: "inception_4b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + 
num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_5x5" + type: "ReLU" + bottom: "inception_4b/5x5" + top: "inception_4b/5x5" +} +layer { + name: "inception_4b/pool" + type: "Pooling" + bottom: "inception_4a/output" + top: "inception_4b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4b/pool_proj" + type: "Convolution" + bottom: "inception_4b/pool" + top: "inception_4b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_pool_proj" + type: "ReLU" + bottom: "inception_4b/pool_proj" + top: "inception_4b/pool_proj" +} +layer { + name: "inception_4b/output" + type: "Concat" + bottom: "inception_4b/1x1" + bottom: "inception_4b/3x3" + bottom: "inception_4b/5x5" + bottom: "inception_4b/pool_proj" + top: "inception_4b/output" +} +layer { + name: "inception_4c/1x1" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_1x1" + type: "ReLU" + bottom: "inception_4c/1x1" + top: "inception_4c/1x1" +} +layer { + name: "inception_4c/3x3_reduce" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer 
{ + name: "inception_4c/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4c/3x3_reduce" + top: "inception_4c/3x3_reduce" +} +layer { + name: "inception_4c/3x3" + type: "Convolution" + bottom: "inception_4c/3x3_reduce" + top: "inception_4c/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_3x3" + type: "ReLU" + bottom: "inception_4c/3x3" + top: "inception_4c/3x3" +} +layer { + name: "inception_4c/5x5_reduce" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4c/5x5_reduce" + top: "inception_4c/5x5_reduce" +} +layer { + name: "inception_4c/5x5" + type: "Convolution" + bottom: "inception_4c/5x5_reduce" + top: "inception_4c/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_5x5" + type: "ReLU" + bottom: "inception_4c/5x5" + top: "inception_4c/5x5" +} +layer { + name: "inception_4c/pool" + type: "Pooling" + bottom: "inception_4b/output" + top: "inception_4c/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4c/pool_proj" + type: "Convolution" + bottom: "inception_4c/pool" + top: "inception_4c/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + 
} + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_pool_proj" + type: "ReLU" + bottom: "inception_4c/pool_proj" + top: "inception_4c/pool_proj" +} +layer { + name: "inception_4c/output" + type: "Concat" + bottom: "inception_4c/1x1" + bottom: "inception_4c/3x3" + bottom: "inception_4c/5x5" + bottom: "inception_4c/pool_proj" + top: "inception_4c/output" +} +layer { + name: "inception_4d/1x1" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 112 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_1x1" + type: "ReLU" + bottom: "inception_4d/1x1" + top: "inception_4d/1x1" +} +layer { + name: "inception_4d/3x3_reduce" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 144 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4d/3x3_reduce" + top: "inception_4d/3x3_reduce" +} +layer { + name: "inception_4d/3x3" + type: "Convolution" + bottom: "inception_4d/3x3_reduce" + top: "inception_4d/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 288 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_3x3" + type: "ReLU" + bottom: "inception_4d/3x3" + top: "inception_4d/3x3" +} +layer { + name: 
"inception_4d/5x5_reduce" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4d/5x5_reduce" + top: "inception_4d/5x5_reduce" +} +layer { + name: "inception_4d/5x5" + type: "Convolution" + bottom: "inception_4d/5x5_reduce" + top: "inception_4d/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_5x5" + type: "ReLU" + bottom: "inception_4d/5x5" + top: "inception_4d/5x5" +} +layer { + name: "inception_4d/pool" + type: "Pooling" + bottom: "inception_4c/output" + top: "inception_4d/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4d/pool_proj" + type: "Convolution" + bottom: "inception_4d/pool" + top: "inception_4d/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_pool_proj" + type: "ReLU" + bottom: "inception_4d/pool_proj" + top: "inception_4d/pool_proj" +} +layer { + name: "inception_4d/output" + type: "Concat" + bottom: "inception_4d/1x1" + bottom: "inception_4d/3x3" + bottom: "inception_4d/5x5" + bottom: "inception_4d/pool_proj" + top: "inception_4d/output" +} +layer { + name: "loss2/ave_pool" + type: "Pooling" + bottom: "inception_4d/output" + top: "loss2/ave_pool" + pooling_param { + 
pool: AVE + kernel_size: 5 + stride: 3 + } +} +layer { + name: "loss2/conv" + type: "Convolution" + bottom: "loss2/ave_pool" + top: "loss2/conv" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss2/relu_conv" + type: "ReLU" + bottom: "loss2/conv" + top: "loss2/conv" +} +layer { + name: "loss2/fc" + type: "InnerProduct" + bottom: "loss2/conv" + top: "loss2/fc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss2/relu_fc" + type: "ReLU" + bottom: "loss2/fc" + top: "loss2/fc" +} +layer { + name: "loss2/drop_fc" + type: "Dropout" + bottom: "loss2/fc" + top: "loss2/fc" + dropout_param { + dropout_ratio: 0.7 + } +} +layer { + name: "loss2/classifier" + type: "InnerProduct" + bottom: "loss2/fc" + top: "loss2/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss2/loss" + type: "SoftmaxWithLoss" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/loss1" + loss_weight: 0.3 +} +layer { + name: "loss2/top-1" + type: "Accuracy" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/top-1" + include { + phase: TEST + } +} +layer { + name: "loss2/top-5" + type: "Accuracy" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} +layer { + name: "inception_4e/1x1" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } 
+ param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_1x1" + type: "ReLU" + bottom: "inception_4e/1x1" + top: "inception_4e/1x1" +} +layer { + name: "inception_4e/3x3_reduce" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4e/3x3_reduce" + top: "inception_4e/3x3_reduce" +} +layer { + name: "inception_4e/3x3" + type: "Convolution" + bottom: "inception_4e/3x3_reduce" + top: "inception_4e/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 320 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_3x3" + type: "ReLU" + bottom: "inception_4e/3x3" + top: "inception_4e/3x3" +} +layer { + name: "inception_4e/5x5_reduce" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4e/5x5_reduce" + top: "inception_4e/5x5_reduce" +} +layer { + name: "inception_4e/5x5" + type: "Convolution" + bottom: "inception_4e/5x5_reduce" + top: "inception_4e/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + 
decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_5x5" + type: "ReLU" + bottom: "inception_4e/5x5" + top: "inception_4e/5x5" +} +layer { + name: "inception_4e/pool" + type: "Pooling" + bottom: "inception_4d/output" + top: "inception_4e/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4e/pool_proj" + type: "Convolution" + bottom: "inception_4e/pool" + top: "inception_4e/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_pool_proj" + type: "ReLU" + bottom: "inception_4e/pool_proj" + top: "inception_4e/pool_proj" +} +layer { + name: "inception_4e/output" + type: "Concat" + bottom: "inception_4e/1x1" + bottom: "inception_4e/3x3" + bottom: "inception_4e/5x5" + bottom: "inception_4e/pool_proj" + top: "inception_4e/output" +} +layer { + name: "pool4/3x3_s2" + type: "Pooling" + bottom: "inception_4e/output" + top: "pool4/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_5a/1x1" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_1x1" + type: "ReLU" + bottom: "inception_5a/1x1" + top: "inception_5a/1x1" +} +layer { + name: "inception_5a/3x3_reduce" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + 
param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_5a/3x3_reduce" + top: "inception_5a/3x3_reduce" +} +layer { + name: "inception_5a/3x3" + type: "Convolution" + bottom: "inception_5a/3x3_reduce" + top: "inception_5a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 320 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_3x3" + type: "ReLU" + bottom: "inception_5a/3x3" + top: "inception_5a/3x3" +} +layer { + name: "inception_5a/5x5_reduce" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_5a/5x5_reduce" + top: "inception_5a/5x5_reduce" +} +layer { + name: "inception_5a/5x5" + type: "Convolution" + bottom: "inception_5a/5x5_reduce" + top: "inception_5a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_5x5" + type: "ReLU" + bottom: "inception_5a/5x5" + top: "inception_5a/5x5" +} +layer { + name: "inception_5a/pool" + type: "Pooling" + bottom: "pool4/3x3_s2" + top: "inception_5a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: 
"inception_5a/pool_proj" + type: "Convolution" + bottom: "inception_5a/pool" + top: "inception_5a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_pool_proj" + type: "ReLU" + bottom: "inception_5a/pool_proj" + top: "inception_5a/pool_proj" +} +layer { + name: "inception_5a/output" + type: "Concat" + bottom: "inception_5a/1x1" + bottom: "inception_5a/3x3" + bottom: "inception_5a/5x5" + bottom: "inception_5a/pool_proj" + top: "inception_5a/output" +} +layer { + name: "inception_5b/1x1" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_1x1" + type: "ReLU" + bottom: "inception_5b/1x1" + top: "inception_5b/1x1" +} +layer { + name: "inception_5b/3x3_reduce" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_5b/3x3_reduce" + top: "inception_5b/3x3_reduce" +} +layer { + name: "inception_5b/3x3" + type: "Convolution" + bottom: "inception_5b/3x3_reduce" + top: "inception_5b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + 
type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_3x3" + type: "ReLU" + bottom: "inception_5b/3x3" + top: "inception_5b/3x3" +} +layer { + name: "inception_5b/5x5_reduce" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 48 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_5b/5x5_reduce" + top: "inception_5b/5x5_reduce" +} +layer { + name: "inception_5b/5x5" + type: "Convolution" + bottom: "inception_5b/5x5_reduce" + top: "inception_5b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_5x5" + type: "ReLU" + bottom: "inception_5b/5x5" + top: "inception_5b/5x5" +} +layer { + name: "inception_5b/pool" + type: "Pooling" + bottom: "inception_5a/output" + top: "inception_5b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_5b/pool_proj" + type: "Convolution" + bottom: "inception_5b/pool" + top: "inception_5b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_pool_proj" + type: "ReLU" + bottom: "inception_5b/pool_proj" + top: "inception_5b/pool_proj" +} +layer { + name: "inception_5b/output" + type: "Concat" + bottom: "inception_5b/1x1" + bottom: "inception_5b/3x3" + bottom: "inception_5b/5x5" + bottom: 
"inception_5b/pool_proj" + top: "inception_5b/output" +} +layer { + name: "pool5/7x7_s1" + type: "Pooling" + bottom: "inception_5b/output" + top: "pool5/7x7_s1" + pooling_param { + pool: AVE + kernel_size: 7 + stride: 1 + } +} +layer { + name: "pool5/drop_7x7_s1" + type: "Dropout" + bottom: "pool5/7x7_s1" + top: "pool5/7x7_s1" + dropout_param { + dropout_ratio: 0.4 + } +} +layer { + name: "loss3/classifier" + type: "InnerProduct" + bottom: "pool5/7x7_s1" + top: "loss3/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss3/loss3" + type: "SoftmaxWithLoss" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/loss3" + loss_weight: 1 +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/top-1" + include { + phase: TEST + } +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} From 4d6fc93191e04eb5327ccb02c8e1eee84b48ae79 Mon Sep 17 00:00:00 2001 From: linxinan Date: Thu, 7 Dec 2017 08:59:07 +0800 Subject: [PATCH 05/53] Add scale value for MSRA weight filler. 
--- include/caffe/filler.hpp | 2 +- src/caffe/proto/caffe.proto | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/include/caffe/filler.hpp b/include/caffe/filler.hpp index a2b5fb2c5..8a966ba24 100644 --- a/include/caffe/filler.hpp +++ b/include/caffe/filler.hpp @@ -230,7 +230,7 @@ template class MSRAFiller : public Filler { FillerParameter_VarianceNorm_FAN_OUT) { n = fan_out; } - Dtype std = sqrt(Dtype(2) / n); + Dtype std = this->filler_param_.scale() * sqrt(Dtype(2) / n); caffe_rng_gaussian(blob->count(), Dtype(0), std, blob->mutable_cpu_data()); CHECK_EQ(this->filler_param_.sparse(), -1) diff --git a/src/caffe/proto/caffe.proto b/src/caffe/proto/caffe.proto index 4a94c3c46..439415c26 100755 --- a/src/caffe/proto/caffe.proto +++ b/src/caffe/proto/caffe.proto @@ -162,6 +162,7 @@ message FillerParameter { optional float max = 4 [default = 1]; // the max value in uniform filler optional float mean = 5 [default = 0]; // the mean value in Gaussian filler optional float std = 6 [default = 1]; // the std value in Gaussian filler + optional float scale = 9 [default = 1]; // the scale value in MSRA filler // The expected number of non-zero output weights for a given input in // Gaussian filler -- the default -1 means don't perform sparsification. optional int32 sparse = 7 [default = -1]; From 2c638dab8fce6fd645fd9e4cb45cdcaf9829cd84 Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Sun, 10 Dec 2017 22:35:17 +0800 Subject: [PATCH 06/53] 1.Set the conv/sum/relu fusion as the default option. 2.Remove the 'ENABLE_CONV_SUM_FUSION' build option. 3.Add the 'DISABLE_CONV_SUM_FUSION' option. 
--- Makefile.config.example | 2 +- cmake/Misc.cmake | 4 ++-- include/caffe/layers/base_conv_layer.hpp | 2 +- src/caffe/layers/base_conv_layer.cpp | 2 +- src/caffe/layers/mkldnn_convolution_layer.cpp | 8 ++++---- src/caffe/net.cpp | 2 +- src/caffe/test/test_mkldnn_convolution_layer.cpp | 4 ++-- 7 files changed, 12 insertions(+), 12 deletions(-) diff --git a/Makefile.config.example b/Makefile.config.example index f157f34f7..ce18c5cd2 100644 --- a/Makefile.config.example +++ b/Makefile.config.example @@ -80,7 +80,7 @@ USE_MKLDNN_AS_DEFAULT_ENGINE := 1 DISABLE_BN_FOLDING := 0 #Use conv/eltwise/relu layer fusion to boost inference. -ENABLE_CONV_SUM_FUSION := 0 +DISABLE_CONV_SUM_FUSION := 0 # Intel(r) Machine Learning Scaling Library (uncomment to build # with MLSL for multi-node training) # USE_MLSL :=1 diff --git a/cmake/Misc.cmake b/cmake/Misc.cmake index 70171ce96..eaff48f7f 100644 --- a/cmake/Misc.cmake +++ b/cmake/Misc.cmake @@ -11,9 +11,9 @@ if(DISABLE_BN_FOLDING) add_definitions("-DDISABLE_BN_FOLDING") endif() -if(ENABLE_CONV_SUM_FUSION) +if(DISABLE_CONV_SUM_FUSION) message(STATUS "conv/eltwise/relu fusion is disabled!") - add_definitions("-DENABLE_CONV_SUM_FUSION") + add_definitions("-DDISABLE_CONV_SUM_FUSION") endif() # --[ If user doesn't specify build type then assume release diff --git a/include/caffe/layers/base_conv_layer.hpp b/include/caffe/layers/base_conv_layer.hpp index 5dd5ca48b..59cb1bf28 100755 --- a/include/caffe/layers/base_conv_layer.hpp +++ b/include/caffe/layers/base_conv_layer.hpp @@ -63,7 +63,7 @@ class BaseConvolutionLayer : public Layer { virtual inline int MinBottomBlobs() const { return 1; } virtual inline int MinTopBlobs() const { return 1; } -#ifndef ENABLE_CONV_SUM_FUSION +#ifdef DISABLE_CONV_SUM_FUSION virtual inline bool EqualNumBottomTopBlobs() const { return true; } #endif protected: diff --git a/src/caffe/layers/base_conv_layer.cpp b/src/caffe/layers/base_conv_layer.cpp index 9f967b43d..bf3f7afc3 100644 --- 
a/src/caffe/layers/base_conv_layer.cpp +++ b/src/caffe/layers/base_conv_layer.cpp @@ -232,7 +232,7 @@ void BaseConvolutionLayer::DoReshape(const vector*>& bottom, num_ = bottom[0]->count(0, channel_axis_); CHECK_EQ(bottom[0]->shape(channel_axis_), channels_) << "Input size incompatible with convolution kernel."; -#ifndef ENABLE_CONV_SUM_FUSION +#ifdef DISABLE_CONV_SUM_FUSION // TODO: generalize to handle inputs of different shapes. for (int bottom_id = 1; bottom_id < bottom.size(); ++bottom_id) { CHECK(bottom[0]->shape() == bottom[bottom_id]->shape()) diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index 4244f7f2f..ab0ec7617 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -146,7 +146,7 @@ void MKLDNNConvolutionLayer::Reshape(const vector*>& bottom init_properties(bottom, top); BaseConvolutionLayer::ReshapeForMKL(bottom, top); -#ifdef ENABLE_CONV_SUM_FUSION +#ifndef DISABLE_CONV_SUM_FUSION if (bottom.size() > 1) { top[0]->ShareData(*bottom[1]); } @@ -210,7 +210,7 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* mkldnn::primitive_attr attr; mkldnn::post_ops ops; -#ifdef ENABLE_CONV_SUM_FUSION +#ifndef DISABLE_CONV_SUM_FUSION if(relu || bottom.size() > 1) { #else if(relu) { @@ -218,7 +218,7 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* float scale = 1.0f; //for fp32, scale is 1. Dtype alpha = negative_slope; // negative slope for mkldnn_eltwise_relu. float beta = 1.0f; //ignored for mkldnn_eltwise_relu. 
-#ifdef ENABLE_CONV_SUM_FUSION +#ifndef DISABLE_CONV_SUM_FUSION if (bottom.size() > 1) { ops.append_sum(1.0f); } @@ -245,7 +245,7 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* for (subEngineIndex = 0; subEngineIndex < ep.getNumberOfSubEngines(); subEngineIndex++) { try { -#ifdef ENABLE_CONV_SUM_FUSION +#ifndef DISABLE_CONV_SUM_FUSION if(relu || bottom.size() > 1) { #else if(relu) { diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index fa8a03b13..3a951dfc9 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -533,7 +533,7 @@ void Net::CompileNet(const NetParameter& param, param_temp2.clear_layer(); // Remove layers CompilationRuleTwo(param_temp, ¶m_temp2); -#ifndef ENABLE_CONV_SUM_FUSION +#ifdef DISABLE_CONV_SUM_FUSION param_compiled->CopyFrom(param_temp2); param_compiled->clear_layer(); // Remove layers CompilationRuleThree(param_temp2, param_compiled); diff --git a/src/caffe/test/test_mkldnn_convolution_layer.cpp b/src/caffe/test/test_mkldnn_convolution_layer.cpp index a2450577c..66a32e8b8 100644 --- a/src/caffe/test/test_mkldnn_convolution_layer.cpp +++ b/src/caffe/test/test_mkldnn_convolution_layer.cpp @@ -300,6 +300,7 @@ TYPED_TEST(MKLDNNConvolutionLayerTest, TestSetupMKLDNN) { EXPECT_EQ(this->blob_top_2_->width(), OW); } +#if 0 TYPED_TEST(MKLDNNConvolutionLayerTest, TestSetupMKLDNNWithRectangeKernelStridePad) { typedef typename TypeParam::Dtype Dtype; LayerParameter layer_param; @@ -418,7 +419,6 @@ TYPED_TEST(MKLDNNConvolutionLayerTest, TestSimpleConvolutionReLUMKLDNN) { } } -#if 0 TYPED_TEST(MKLDNNConvolutionLayerTest, TestDilatedConvolutionMKLDNN) { typedef typename TypeParam::Dtype Dtype; vector bottom_shape; @@ -1010,7 +1010,6 @@ TYPED_TEST(MKLDNNConvolutionLayerTest, TestGradient3D) { checker.CheckGradientExhaustive(&layer, this->blob_bottom_vec_, this->blob_top_vec_); } -#endif TYPED_TEST(MKLDNNConvolutionLayerTest, Test1x1Gradient) { typedef typename TypeParam::Dtype Dtype; @@ -1030,6 +1029,7 @@ 
TYPED_TEST(MKLDNNConvolutionLayerTest, Test1x1Gradient) { this->blob_top_vec_); } +#endif TYPED_TEST(MKLDNNConvolutionLayerTest, TestGradientGroup) { typedef typename TypeParam::Dtype Dtype; LayerParameter layer_param; From 1fbb6e52f76b81f1113ccf5a4c7ba9811cae9354 Mon Sep 17 00:00:00 2001 From: Haihao Shen Date: Mon, 11 Dec 2017 15:57:23 +0800 Subject: [PATCH 07/53] Remove unused model and add dummydata for SSD --- .../SSD_300x300/deploy_mkl2017.prototxt | 1629 ----------------- ...ldnn.prototxt => train_dummydata.prototxt} | 142 +- 2 files changed, 73 insertions(+), 1698 deletions(-) delete mode 100644 models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkl2017.prototxt rename models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/{deploy_mkldnn.prototxt => train_dummydata.prototxt} (94%) diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkl2017.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkl2017.prototxt deleted file mode 100644 index 6d03b44f3..000000000 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkl2017.prototxt +++ /dev/null @@ -1,1629 +0,0 @@ -name: "VGG_VOC0712_SSD_300x300_deploy" -input: "data" -input_shape { - dim: 1 - dim: 3 - dim: 300 - dim: 300 -} -layer { - engine: "MKL2017" - name: "conv1_1" - type: "Convolution" - bottom: "data" - top: "conv1_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 64 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu1_1" - type: "ReLU" - bottom: "conv1_1" - top: "conv1_1" -} -layer { - engine: "MKL2017" - name: "conv1_2" - type: "Convolution" - bottom: "conv1_1" - top: "conv1_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 64 - pad: 1 - 
kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu1_2" - type: "ReLU" - bottom: "conv1_2" - top: "conv1_2" -} -layer { - engine: "MKL2017" - name: "pool1" - type: "Pooling" - bottom: "conv1_2" - top: "pool1" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - engine: "MKL2017" - name: "conv2_1" - type: "Convolution" - bottom: "pool1" - top: "conv2_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu2_1" - type: "ReLU" - bottom: "conv2_1" - top: "conv2_1" -} -layer { - engine: "MKL2017" - name: "conv2_2" - type: "Convolution" - bottom: "conv2_1" - top: "conv2_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu2_2" - type: "ReLU" - bottom: "conv2_2" - top: "conv2_2" -} -layer { - engine: "MKL2017" - name: "pool2" - type: "Pooling" - bottom: "conv2_2" - top: "pool2" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - engine: "MKL2017" - name: "conv3_1" - type: "Convolution" - bottom: "pool2" - top: "conv3_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu3_1" - type: "ReLU" - bottom: "conv3_1" - top: "conv3_1" -} -layer { - engine: "MKL2017" - name: "conv3_2" - type: "Convolution" - bottom: "conv3_1" - 
top: "conv3_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu3_2" - type: "ReLU" - bottom: "conv3_2" - top: "conv3_2" -} -layer { - engine: "MKL2017" - name: "conv3_3" - type: "Convolution" - bottom: "conv3_2" - top: "conv3_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu3_3" - type: "ReLU" - bottom: "conv3_3" - top: "conv3_3" -} -layer { - engine: "MKL2017" - name: "pool3" - type: "Pooling" - bottom: "conv3_3" - top: "pool3" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - engine: "MKL2017" - name: "conv4_1" - type: "Convolution" - bottom: "pool3" - top: "conv4_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu4_1" - type: "ReLU" - bottom: "conv4_1" - top: "conv4_1" -} -layer { - engine: "MKL2017" - name: "conv4_2" - type: "Convolution" - bottom: "conv4_1" - top: "conv4_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu4_2" - type: "ReLU" - bottom: "conv4_2" - top: "conv4_2" -} -layer { - engine: "MKL2017" - name: "conv4_3" - type: "Convolution" - bottom: "conv4_2" - top: 
"conv4_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu4_3" - type: "ReLU" - bottom: "conv4_3" - top: "conv4_3" -} -layer { - engine: "MKL2017" - name: "pool4" - type: "Pooling" - bottom: "conv4_3" - top: "pool4" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - engine: "MKL2017" - name: "conv5_1" - type: "Convolution" - bottom: "pool4" - top: "conv5_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - engine: "MKL2017" - name: "relu5_1" - type: "ReLU" - bottom: "conv5_1" - top: "conv5_1" -} -layer { - engine: "MKL2017" - name: "conv5_2" - type: "Convolution" - bottom: "conv5_1" - top: "conv5_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - engine: "MKL2017" - name: "relu5_2" - type: "ReLU" - bottom: "conv5_2" - top: "conv5_2" -} -layer { - engine: "MKL2017" - name: "conv5_3" - type: "Convolution" - bottom: "conv5_2" - top: "conv5_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - engine: "MKL2017" - name: "relu5_3" - type: "ReLU" - bottom: "conv5_3" - top: "conv5_3" -} -layer { - engine: "MKL2017" - name: "pool5" - type: "Pooling" - 
bottom: "conv5_3" - top: "pool5" - pooling_param { - pool: MAX - kernel_size: 3 - stride: 1 - pad: 1 - } -} -layer { - engine: "MKL2017" - name: "fc6" - type: "Convolution" - bottom: "pool5" - top: "fc6" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 1024 - pad: 6 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 6 - } -} -layer { - engine: "MKL2017" - name: "relu6" - type: "ReLU" - bottom: "fc6" - top: "fc6" -} -layer { - engine: "MKL2017" - name: "fc7" - type: "Convolution" - bottom: "fc6" - top: "fc7" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 1024 - kernel_size: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "relu7" - type: "ReLU" - bottom: "fc7" - top: "fc7" -} -layer { - engine: "MKL2017" - name: "conv6_1" - type: "Convolution" - bottom: "fc7" - top: "conv6_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv6_1_relu" - type: "ReLU" - bottom: "conv6_1" - top: "conv6_1" -} -layer { - engine: "MKL2017" - name: "conv6_2" - type: "Convolution" - bottom: "conv6_1" - top: "conv6_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - stride: 2 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv6_2_relu" - type: "ReLU" - bottom: "conv6_2" - top: "conv6_2" -} -layer { - engine: "MKL2017" - name: "conv7_1" - type: "Convolution" - 
bottom: "conv6_2" - top: "conv7_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv7_1_relu" - type: "ReLU" - bottom: "conv7_1" - top: "conv7_1" -} -layer { - engine: "MKL2017" - name: "conv7_2" - type: "Convolution" - bottom: "conv7_1" - top: "conv7_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - stride: 2 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv7_2_relu" - type: "ReLU" - bottom: "conv7_2" - top: "conv7_2" -} -layer { - engine: "MKL2017" - name: "conv8_1" - type: "Convolution" - bottom: "conv7_2" - top: "conv8_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv8_1_relu" - type: "ReLU" - bottom: "conv8_1" - top: "conv8_1" -} -layer { - engine: "MKL2017" - name: "conv8_2" - type: "Convolution" - bottom: "conv8_1" - top: "conv8_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv8_2_relu" - type: "ReLU" - bottom: "conv8_2" - top: "conv8_2" -} -layer { - engine: "MKL2017" - name: "conv9_1" - type: "Convolution" - bottom: "conv8_2" - top: "conv9_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - 
decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv9_1_relu" - type: "ReLU" - bottom: "conv9_1" - top: "conv9_1" -} -layer { - engine: "MKL2017" - name: "conv9_2" - type: "Convolution" - bottom: "conv9_1" - top: "conv9_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - engine: "MKL2017" - name: "conv9_2_relu" - type: "ReLU" - bottom: "conv9_2" - top: "conv9_2" -} -layer { - name: "conv4_3_norm" - type: "Normalize" - bottom: "conv4_3" - top: "conv4_3_norm" - norm_param { - across_spatial: false - scale_filler { - type: "constant" - value: 20 - } - channel_shared: false - } -} -layer { - name: "conv4_3_norm_mbox_loc" - type: "Convolution" - bottom: "conv4_3_norm" - top: "conv4_3_norm_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv4_3_norm_mbox_loc_perm" - type: "Permute" - bottom: "conv4_3_norm_mbox_loc" - top: "conv4_3_norm_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv4_3_norm_mbox_loc_flat" - type: "Flatten" - bottom: "conv4_3_norm_mbox_loc_perm" - top: "conv4_3_norm_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv4_3_norm_mbox_conf" - type: "Convolution" - bottom: "conv4_3_norm" - top: "conv4_3_norm_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - 
kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } - engine: "CAFFE" -} -layer { - name: "conv4_3_norm_mbox_conf_perm" - type: "Permute" - bottom: "conv4_3_norm_mbox_conf" - top: "conv4_3_norm_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv4_3_norm_mbox_conf_flat" - type: "Flatten" - bottom: "conv4_3_norm_mbox_conf_perm" - top: "conv4_3_norm_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv4_3_norm_mbox_priorbox" - type: "PriorBox" - bottom: "conv4_3_norm" - bottom: "data" - top: "conv4_3_norm_mbox_priorbox" - prior_box_param { - min_size: 30.0 - max_size: 60.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 8 - offset: 0.5 - } -} -layer { - engine: "MKL2017" - name: "fc7_mbox_loc" - type: "Convolution" - bottom: "fc7" - top: "fc7_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "fc7_mbox_loc_perm" - type: "Permute" - bottom: "fc7_mbox_loc" - top: "fc7_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "fc7_mbox_loc_flat" - type: "Flatten" - bottom: "fc7_mbox_loc_perm" - top: "fc7_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "fc7_mbox_conf" - type: "Convolution" - bottom: "fc7" - top: "fc7_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } - engine: "CAFFE" -} -layer { - name: "fc7_mbox_conf_perm" - type: "Permute" - bottom: 
"fc7_mbox_conf" - top: "fc7_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "fc7_mbox_conf_flat" - type: "Flatten" - bottom: "fc7_mbox_conf_perm" - top: "fc7_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "fc7_mbox_priorbox" - type: "PriorBox" - bottom: "fc7" - bottom: "data" - top: "fc7_mbox_priorbox" - prior_box_param { - min_size: 60.0 - max_size: 111.0 - aspect_ratio: 2 - aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 16 - offset: 0.5 - } -} -layer { - engine: "MKL2017" - name: "conv6_2_mbox_loc" - type: "Convolution" - bottom: "conv6_2" - top: "conv6_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv6_2_mbox_loc_perm" - type: "Permute" - bottom: "conv6_2_mbox_loc" - top: "conv6_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv6_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv6_2_mbox_loc_perm" - top: "conv6_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv6_2_mbox_conf" - type: "Convolution" - bottom: "conv6_2" - top: "conv6_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } - engine: "CAFFE" -} -layer { - name: "conv6_2_mbox_conf_perm" - type: "Permute" - bottom: "conv6_2_mbox_conf" - top: "conv6_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv6_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv6_2_mbox_conf_perm" - top: 
"conv6_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv6_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv6_2" - bottom: "data" - top: "conv6_2_mbox_priorbox" - prior_box_param { - min_size: 111.0 - max_size: 162.0 - aspect_ratio: 2 - aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 32 - offset: 0.5 - } -} -layer { - name: "conv7_2_mbox_loc" - type: "Convolution" - bottom: "conv7_2" - top: "conv7_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_2_mbox_loc_perm" - type: "Permute" - bottom: "conv7_2_mbox_loc" - top: "conv7_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv7_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv7_2_mbox_loc_perm" - top: "conv7_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - engine: "MKL2017" - name: "conv7_2_mbox_conf" - type: "Convolution" - bottom: "conv7_2" - top: "conv7_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_2_mbox_conf_perm" - type: "Permute" - bottom: "conv7_2_mbox_conf" - top: "conv7_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv7_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv7_2_mbox_conf_perm" - top: "conv7_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv7_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv7_2" - bottom: "data" - top: "conv7_2_mbox_priorbox" - prior_box_param { 
- min_size: 162.0 - max_size: 213.0 - aspect_ratio: 2 - aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 64 - offset: 0.5 - } -} -layer { - engine: "MKL2017" - name: "conv8_2_mbox_loc" - type: "Convolution" - bottom: "conv8_2" - top: "conv8_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_2_mbox_loc_perm" - type: "Permute" - bottom: "conv8_2_mbox_loc" - top: "conv8_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv8_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv8_2_mbox_loc_perm" - top: "conv8_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - engine: "MKL2017" - name: "conv8_2_mbox_conf" - type: "Convolution" - bottom: "conv8_2" - top: "conv8_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_2_mbox_conf_perm" - type: "Permute" - bottom: "conv8_2_mbox_conf" - top: "conv8_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv8_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv8_2_mbox_conf_perm" - top: "conv8_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv8_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv8_2" - bottom: "data" - top: "conv8_2_mbox_priorbox" - prior_box_param { - min_size: 213.0 - max_size: 264.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 100 - offset: 0.5 - } -} -layer { - 
name: "conv9_2_mbox_loc" - type: "Convolution" - bottom: "conv9_2" - top: "conv9_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_2_mbox_loc_perm" - type: "Permute" - bottom: "conv9_2_mbox_loc" - top: "conv9_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv9_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv9_2_mbox_loc_perm" - top: "conv9_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - engine: "MKL2017" - name: "conv9_2_mbox_conf" - type: "Convolution" - bottom: "conv9_2" - top: "conv9_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_2_mbox_conf_perm" - type: "Permute" - bottom: "conv9_2_mbox_conf" - top: "conv9_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv9_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv9_2_mbox_conf_perm" - top: "conv9_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv9_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv9_2" - bottom: "data" - top: "conv9_2_mbox_priorbox" - prior_box_param { - min_size: 264.0 - max_size: 315.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 300 - offset: 0.5 - } -} -layer { - name: "mbox_loc" - type: "Concat" - bottom: "conv4_3_norm_mbox_loc_flat" - bottom: "fc7_mbox_loc_flat" - bottom: "conv6_2_mbox_loc_flat" - bottom: "conv7_2_mbox_loc_flat" - bottom: "conv8_2_mbox_loc_flat" - bottom: 
"conv9_2_mbox_loc_flat" - top: "mbox_loc" - concat_param { - axis: 1 - } - engine: "CAFFE" -} -layer { - name: "mbox_conf" - type: "Concat" - bottom: "conv4_3_norm_mbox_conf_flat" - bottom: "fc7_mbox_conf_flat" - bottom: "conv6_2_mbox_conf_flat" - bottom: "conv7_2_mbox_conf_flat" - bottom: "conv8_2_mbox_conf_flat" - bottom: "conv9_2_mbox_conf_flat" - top: "mbox_conf" - concat_param { - axis: 1 - } - engine: "CAFFE" -} -layer { - name: "mbox_priorbox" - type: "Concat" - bottom: "conv4_3_norm_mbox_priorbox" - bottom: "fc7_mbox_priorbox" - bottom: "conv6_2_mbox_priorbox" - bottom: "conv7_2_mbox_priorbox" - bottom: "conv8_2_mbox_priorbox" - bottom: "conv9_2_mbox_priorbox" - top: "mbox_priorbox" - concat_param { - axis: 2 - } - engine: "CAFFE" -} diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkldnn.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt similarity index 94% rename from models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkldnn.prototxt rename to models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt index 7d34d1aa4..41cf79ab3 100644 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy_mkldnn.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt @@ -1,13 +1,39 @@ -name: "VGG_VOC0712_SSD_300x300_deploy" -input: "data" -input_shape { - dim: 1 - dim: 3 - dim: 300 - dim: 300 +name: "VGG_VOC0712_SSD_300x300_train" +layer { + name: "data" + type: "DummyData" + top: "data" + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape { + dim: 32 + dim: 3 + dim: 300 + dim: 300 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + dummy_data_param { + data_filler { + type: "constant" + value: 1 + } + shape { + dim: 1 + dim: 1 + dim: 1 + dim: 8 + } + } } layer { - engine: "MKLDNN" name: "conv1_1" type: "Convolution" bottom: "data" @@ 
-34,14 +60,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu1_1" type: "ReLU" bottom: "conv1_1" top: "conv1_1" } layer { - engine: "MKLDNN" name: "conv1_2" type: "Convolution" bottom: "conv1_1" @@ -68,14 +92,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu1_2" type: "ReLU" bottom: "conv1_2" top: "conv1_2" } layer { - engine: "MKLDNN" name: "pool1" type: "Pooling" bottom: "conv1_2" @@ -87,7 +109,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv2_1" type: "Convolution" bottom: "pool1" @@ -114,14 +135,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu2_1" type: "ReLU" bottom: "conv2_1" top: "conv2_1" } layer { - engine: "MKLDNN" name: "conv2_2" type: "Convolution" bottom: "conv2_1" @@ -148,14 +167,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu2_2" type: "ReLU" bottom: "conv2_2" top: "conv2_2" } layer { - engine: "MKLDNN" name: "pool2" type: "Pooling" bottom: "conv2_2" @@ -167,7 +184,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv3_1" type: "Convolution" bottom: "pool2" @@ -194,14 +210,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu3_1" type: "ReLU" bottom: "conv3_1" top: "conv3_1" } layer { - engine: "MKLDNN" name: "conv3_2" type: "Convolution" bottom: "conv3_1" @@ -228,14 +242,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu3_2" type: "ReLU" bottom: "conv3_2" top: "conv3_2" } layer { - engine: "MKLDNN" name: "conv3_3" type: "Convolution" bottom: "conv3_2" @@ -262,14 +274,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu3_3" type: "ReLU" bottom: "conv3_3" top: "conv3_3" } layer { - engine: "MKLDNN" name: "pool3" type: "Pooling" bottom: "conv3_3" @@ -281,7 +291,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv4_1" type: "Convolution" bottom: "pool3" @@ -308,14 +317,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu4_1" type: "ReLU" bottom: "conv4_1" top: "conv4_1" } layer { - engine: "MKLDNN" name: "conv4_2" type: "Convolution" bottom: "conv4_1" @@ -342,14 +349,12 @@ layer { } } layer { - 
engine: "MKLDNN" name: "relu4_2" type: "ReLU" bottom: "conv4_2" top: "conv4_2" } layer { - engine: "MKLDNN" name: "conv4_3" type: "Convolution" bottom: "conv4_2" @@ -376,14 +381,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu4_3" type: "ReLU" bottom: "conv4_3" top: "conv4_3" } layer { - engine: "MKLDNN" name: "pool4" type: "Pooling" bottom: "conv4_3" @@ -395,7 +398,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv5_1" type: "Convolution" bottom: "pool4" @@ -423,14 +425,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu5_1" type: "ReLU" bottom: "conv5_1" top: "conv5_1" } layer { - engine: "MKLDNN" name: "conv5_2" type: "Convolution" bottom: "conv5_1" @@ -458,14 +458,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu5_2" type: "ReLU" bottom: "conv5_2" top: "conv5_2" } layer { - engine: "MKLDNN" name: "conv5_3" type: "Convolution" bottom: "conv5_2" @@ -493,14 +491,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu5_3" type: "ReLU" bottom: "conv5_3" top: "conv5_3" } layer { - engine: "MKLDNN" name: "pool5" type: "Pooling" bottom: "conv5_3" @@ -513,7 +509,6 @@ layer { } } layer { - engine: "MKLDNN" name: "fc6" type: "Convolution" bottom: "pool5" @@ -541,14 +536,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu6" type: "ReLU" bottom: "fc6" top: "fc6" } layer { - engine: "MKLDNN" name: "fc7" type: "Convolution" bottom: "fc6" @@ -574,14 +567,12 @@ layer { } } layer { - engine: "MKLDNN" name: "relu7" type: "ReLU" bottom: "fc7" top: "fc7" } layer { - engine: "MKLDNN" name: "conv6_1" type: "Convolution" bottom: "fc7" @@ -609,14 +600,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv6_1_relu" type: "ReLU" bottom: "conv6_1" top: "conv6_1" } layer { - engine: "MKLDNN" name: "conv6_2" type: "Convolution" bottom: "conv6_1" @@ -644,14 +633,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv6_2_relu" type: "ReLU" bottom: "conv6_2" top: "conv6_2" } layer { - engine: "MKLDNN" name: "conv7_1" type: "Convolution" bottom: "conv6_2" @@ 
-679,14 +666,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv7_1_relu" type: "ReLU" bottom: "conv7_1" top: "conv7_1" } layer { - engine: "MKLDNN" name: "conv7_2" type: "Convolution" bottom: "conv7_1" @@ -714,14 +699,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv7_2_relu" type: "ReLU" bottom: "conv7_2" top: "conv7_2" } layer { - engine: "MKLDNN" name: "conv8_1" type: "Convolution" bottom: "conv7_2" @@ -749,14 +732,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv8_1_relu" type: "ReLU" bottom: "conv8_1" top: "conv8_1" } layer { - engine: "MKLDNN" name: "conv8_2" type: "Convolution" bottom: "conv8_1" @@ -784,14 +765,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv8_2_relu" type: "ReLU" bottom: "conv8_2" top: "conv8_2" } layer { - engine: "MKLDNN" name: "conv9_1" type: "Convolution" bottom: "conv8_2" @@ -819,14 +798,12 @@ layer { } } layer { - engine: "MKLDNN" name: "conv9_1_relu" type: "ReLU" bottom: "conv9_1" top: "conv9_1" } layer { - engine: "MKLDNN" name: "conv9_2" type: "Convolution" bottom: "conv9_1" @@ -854,7 +831,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv9_2_relu" type: "ReLU" bottom: "conv9_2" @@ -948,7 +924,6 @@ layer { value: 0 } } - engine: "CAFFE" } layer { name: "conv4_3_norm_mbox_conf_perm" @@ -992,7 +967,6 @@ layer { } } layer { - engine: "MKLDNN" name: "fc7_mbox_loc" type: "Convolution" bottom: "fc7" @@ -1066,7 +1040,6 @@ layer { value: 0 } } - engine: "CAFFE" } layer { name: "fc7_mbox_conf_perm" @@ -1111,7 +1084,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv6_2_mbox_loc" type: "Convolution" bottom: "conv6_2" @@ -1185,7 +1157,6 @@ layer { value: 0 } } - engine: "CAFFE" } layer { name: "conv6_2_mbox_conf_perm" @@ -1278,7 +1249,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv7_2_mbox_conf" type: "Convolution" bottom: "conv7_2" @@ -1348,7 +1318,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv8_2_mbox_loc" type: "Convolution" bottom: "conv8_2" @@ -1397,7 +1366,6 @@ layer { } } layer { - 
engine: "MKLDNN" name: "conv8_2_mbox_conf" type: "Convolution" bottom: "conv8_2" @@ -1514,7 +1482,6 @@ layer { } } layer { - engine: "MKLDNN" name: "conv9_2_mbox_conf" type: "Convolution" bottom: "conv9_2" @@ -1595,7 +1562,7 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" + engine: "CAFFE" } layer { name: "mbox_conf" @@ -1610,7 +1577,7 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" + engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1627,3 +1594,40 @@ layer { } engine: "CAFFE" } +layer { + name: "mbox_loss" + type: "MultiBoxLoss" + bottom: "mbox_loc" + bottom: "mbox_conf" + bottom: "mbox_priorbox" + bottom: "label" + top: "mbox_loss" + include { + phase: TRAIN + } + propagate_down: true + propagate_down: true + propagate_down: false + propagate_down: false + loss_param { + normalization: VALID + } + multibox_loss_param { + loc_loss_type: SMOOTH_L1 + conf_loss_type: SOFTMAX + loc_weight: 1.0 + num_classes: 21 + share_location: true + match_type: PER_PREDICTION + overlap_threshold: 0.5 + use_prior_for_matching: true + background_label_id: 0 + use_difficult_gt: true + neg_pos_ratio: 3.0 + neg_overlap: 0.5 + code_type: CENTER_SIZE + ignore_cross_boundary_bbox: false + mining_type: MAX_NEGATIVE + } +} + From 199bed6799891e609f5e15eea20773cd245b2100 Mon Sep 17 00:00:00 2001 From: fzou1 Date: Mon, 11 Dec 2017 14:43:25 +0800 Subject: [PATCH 08/53] move timing logic to net class --- include/caffe/net.hpp | 88 ++++------- include/caffe/solver.hpp | 32 ---- scripts/build_intelcaffe.sh | 14 ++ scripts/prepare_env.sh | 43 ++++-- src/caffe/multinode/multi_solver.cpp | 47 ++++++ src/caffe/net.cpp | 219 ++++++++++++++++++++++++++- src/caffe/solver.cpp | 186 +---------------------- src/caffe/solvers/sgd_solver.cpp | 8 +- 8 files changed, 349 insertions(+), 288 deletions(-) diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index 8438bfa06..ad1411bc2 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -49,56 +49,10 @@ OF THIS SOFTWARE, EVEN IF 
ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "caffe/layer.hpp" #include "caffe/proto/caffe.pb.h" -namespace caffe { - -#ifdef CAFFE_PER_LAYER_TIMINGS - template class Solver; - -#define LAYER_TIMING_START() do { \ - root_solver_->timer.Start(); \ -}while(0) - -#define LAYER_TIMING_STOP(name, index) do { \ - root_solver_->name##_time_per_layer[index] += root_solver_->timer.MicroSeconds(); \ -}while(0) - -#ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() do { \ - root_solver_->wait_timer.Start(); \ -}while(0) - -#define LAYER_WAIT_TIMING_STOP(layer_index) do { \ - root_solver_->waitcomm_time_per_layer[layer_index] += root_solver_->wait_timer.MicroSeconds(); \ -}while(0) - -#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) do { \ - root_solver_->waitcomm_time_per_layer[layer_i] -= root_solver_->update_time_per_layer[layer_k]; \ -} while (0) -#endif - -#define ITER_TIMING_START() do { \ - root_solver_->timer.Start(); \ -}while(0) - -#define ITER_TIMING_STOP(name) do { \ - root_solver_->name##_time_per_iter += root_solver_->timer.MicroSeconds(); \ -}while(0) +#include "caffe/util/benchmark.hpp" -#else -#define LAYER_TIMING_START() -#define LAYER_TIMING_STOP(name,index) - -#ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() -#define LAYER_WAIT_TIMING_STOP(index) -#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) -#endif - -#define ITER_TIMING_START() -#define ITER_TIMING_STOP(name) - -#endif /* CAFFE_PER_LAYER_TIMINGS */ +namespace caffe { /** * @brief Connects Layer%s together into a directed acyclic graph (DAG) @@ -385,13 +339,41 @@ class Net { /// @brief return whether NetState state meets NetStateRule rule static bool StateMeetsRule(const NetState& state, const NetStateRule& rule, const string& layer_name); -#ifdef CAFFE_PER_LAYER_TIMINGS - void set_root_solver(Solver * solver) { root_solver_ = solver; } -#endif inline const map& blob_names_index() const { return blob_names_index_; } +#ifdef CAFFE_PER_LAYER_TIMINGS + /* Timers for performance 
measurements */ + Timer timer; +#ifdef FW_OVERLAP_OPT + Timer wait_timer; +#endif + std::vector forward_time_per_layer; + std::vector backward_time_per_layer; + std::vector update_time_per_layer; + double cleardiffs_time_per_iter; +#ifdef USE_MLSL + std::vector startcomm_time_per_layer; + std::vector waitcomm_time_per_layer; +#endif + + std::vector forward_time_per_layer_total; + std::vector backward_time_per_layer_total; + std::vector update_time_per_layer_total; + double cleardiffs_time_per_iter_total; +#ifdef USE_MLSL + std::vector startcomm_time_per_layer_total; + std::vector waitcomm_time_per_layer_total; +#endif + + void InitTimers(); + void ResetTimers(); + void PrintTimers(bool printTotal); + +#endif /* CAFFE_PER_LAYER_TIMINGS */ + + protected: // Helpers for Init. /// @brief Append a new top blob to the net. @@ -477,10 +459,6 @@ class Net { /// The root net that actually holds the shared layers in data parallelism const Net* const root_net_; DISABLE_COPY_AND_ASSIGN(Net); - -#ifdef CAFFE_PER_LAYER_TIMINGS - Solver * root_solver_; -#endif }; diff --git a/include/caffe/solver.hpp b/include/caffe/solver.hpp index 71489fbb8..bbbc87944 100644 --- a/include/caffe/solver.hpp +++ b/include/caffe/solver.hpp @@ -44,7 +44,6 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
#include "caffe/net.hpp" #include "caffe/solver_factory.hpp" -#include "caffe/util/benchmark.hpp" namespace caffe { @@ -161,37 +160,6 @@ class Solver { void TestAll(); - -#ifdef CAFFE_PER_LAYER_TIMINGS - /* Timers for performance measurements */ - Timer timer; -#ifdef FW_OVERLAP_OPT - Timer wait_timer; -#endif - std::vector forward_time_per_layer; - std::vector backward_time_per_layer; - std::vector update_time_per_layer; - double cleardiffs_time_per_iter; -#ifdef USE_MLSL - std::vector startcomm_time_per_layer; - std::vector waitcomm_time_per_layer; -#endif - - std::vector forward_time_per_layer_total; - std::vector backward_time_per_layer_total; - std::vector update_time_per_layer_total; - double cleardiffs_time_per_iter_total; -#ifdef USE_MLSL - std::vector startcomm_time_per_layer_total; - std::vector waitcomm_time_per_layer_total; -#endif - - void InitTimers(); - void ResetTimers(); - void PrintTimers(bool printTotal); - -#endif /* CAFFE_PER_LAYER_TIMINGS */ - protected: string SnapshotFilename(const string extension); string SnapshotToBinaryProto(); diff --git a/scripts/build_intelcaffe.sh b/scripts/build_intelcaffe.sh index c2e9a25a5..d9bddaeca 100755 --- a/scripts/build_intelcaffe.sh +++ b/scripts/build_intelcaffe.sh @@ -6,6 +6,7 @@ function usage echo "Usage:" echo " $script_name [--multinode] [--compiler icc/gcc] [--rebuild] " echo " [--boost_root boost_install_dir] [--layer_timing]" + echo " [--debug]" echo "" echo " Parameters:" echo " multinode: specify it to build caffe for multinode. build for single" @@ -18,6 +19,7 @@ function usage echo " boost in directory of caffe source and build it." echo " layer_timing: build caffe for multinode with CAFFE_PER_LAYER_TIMINGS flag." echo " by default, the flag is NOT included for build." + echo " debug: build caffe with debug flag. by default, the option is off." 
} function check_dependency @@ -49,6 +51,10 @@ function build_caffe_gcc fi fi + if [ $debug -eq 1 ]; then + echo "DEBUG := 1" >> Makefile.config + fi + if [ $is_rebuild -eq 1 ]; then make clean fi @@ -95,6 +101,10 @@ function build_caffe_icc fi fi + if [ $debug -eq 1 ]; then + cmake_params+=" -DDEBUG=1" + fi + build_dir=$root_dir/build if [ $is_rebuild -eq 1 ] && [ -d $build_dir ]; then rm -r $build_dir @@ -123,6 +133,7 @@ function sync_caffe_dir root_dir=$(cd $(dirname $(dirname $0)); pwd) +debug=0 is_layer_timing=0 boost_root="" is_rebuild=0 @@ -153,6 +164,9 @@ do usage exit 0 ;; + --debug) + debug=1 + ;; *) echo "Unknown option: $key" usage diff --git a/scripts/prepare_env.sh b/scripts/prepare_env.sh index 6c128d892..b3a57bc75 100755 --- a/scripts/prepare_env.sh +++ b/scripts/prepare_env.sh @@ -4,14 +4,18 @@ function usage { script_name=$0 echo "Usage:" - echo " $script_name [--hostfile host_file] [--compiler icc/gcc]" + echo " $script_name [--hostfile host_file] [--compiler icc/gcc] [--help] [--skip_install] [--skip_build]" echo "" echo " Parameters:" echo " host: host file includes list of nodes. Only used when you want to install dependencies for multinode" - echo " compiler: specify compiler to build intel caffe. default compiler is icc." + echo " compiler: specify compiler to build Intel Caffe. default compiler is icc." + echo " help: print usage." + echo " skip_install: skip installing dependencies for Intel Caffe." + echo " skip_build: skip building Intel Caffe." } - +skip_install=0 +skip_build=0 compiler="icc" host_file="" while [[ $# -ge 1 ]] @@ -30,6 +34,12 @@ do usage exit 0 ;; + --skip_install) + skip_install=1 + ;; + --skip_build) + skip_build=1 + ;; *) echo "Unknown option: $key" usage @@ -41,18 +51,25 @@ done script_dir=$(cd $(dirname $0); pwd) - -params="" -if [ "$host_file" != "" ] && [ -f $host_file ]; then - params+=" --hostfile $host_file" +if [ $skip_install -eq 1 ]; then + echo "Skip installing dependencies for Intel Caffe." 
+else + params="" + if [ "$host_file" != "" ] && [ -f $host_file ]; then + params+=" --hostfile $host_file" + fi + $script_dir/install_deps.sh $params fi -$script_dir/install_deps.sh $params -echo "Build caffe..." -params="--compiler $compiler --rebuild " -if [ "$host_file" != "" ] && [ -f $host_file ]; then - params+=" --multinode --layer_timing" +if [ $skip_build -eq 1 ]; then + echo "Skip building Intel Caffe." +else + echo "Build Caffe..." + params="--compiler $compiler --rebuild " + if [ "$host_file" != "" ] && [ -f $host_file ]; then + params+=" --multinode --layer_timing" + fi + $script_dir/build_intelcaffe.sh $params fi -$script_dir/build_intelcaffe.sh $params echo "Done." diff --git a/src/caffe/multinode/multi_solver.cpp b/src/caffe/multinode/multi_solver.cpp index 2887d1a43..a4bdbbe90 100644 --- a/src/caffe/multinode/multi_solver.cpp +++ b/src/caffe/multinode/multi_solver.cpp @@ -46,6 +46,53 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. namespace caffe { +#ifdef CAFFE_PER_LAYER_TIMINGS + +#define LAYER_TIMING_START() do { \ + if (root_solver_->net()->phase() == TRAIN) { \ + root_solver_->net()->timer.Start(); \ + } \ +}while(0) + +#define LAYER_TIMING_STOP(name, index) do { \ + if (root_solver_->net()->phase() == TRAIN) { \ + root_solver_->net()->name##_time_per_layer[index] += root_solver_->net()->timer.MicroSeconds(); \ + } \ +}while(0) + +#ifdef FW_OVERLAP_OPT +#define LAYER_WAIT_TIMING_START() do { \ + if (root_solver_->net()->phase() == TRAIN) { \ + root_solver_->net()->wait_timer.Start(); \ + } \ +}while(0) + +#define LAYER_WAIT_TIMING_STOP(layer_index) do { \ + if (root_solver_->net()->phase() == TRAIN) { \ + root_solver_->net()->waitcomm_time_per_layer[layer_index] += root_solver_->net()->wait_timer.MicroSeconds(); \ + } \ +}while(0) + +#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) do { \ + if (root_solver_->net()->phase() == TRAIN) { \ + root_solver_->net()->waitcomm_time_per_layer[layer_i] -= 
root_solver_->net()->update_time_per_layer[layer_k]; \ + } \ +} while (0) +#endif + +#else + +#define LAYER_TIMING_START() +#define LAYER_TIMING_STOP(name,index) + +#ifdef FW_OVERLAP_OPT +#define LAYER_WAIT_TIMING_START() +#define LAYER_WAIT_TIMING_STOP(index) +#define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) +#endif + +#endif /* CAFFE_PER_LAYER_TIMINGS */ + template inline bool MultiSolver::IsSkipWaitGradient(int layer_id) { diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 3a951dfc9..a5c037668 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -64,14 +64,47 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "caffe/util/remove_batch_norm.hpp" #include "caffe/util/apply_bn_stats_batch_size.hpp" -#ifdef CAFFE_PER_LAYER_TIMINGS -#include "caffe/solver.hpp" -#endif - PERFORMANCE_CREATE_MONITOR(); namespace caffe { +#ifdef CAFFE_PER_LAYER_TIMINGS + +#define LAYER_TIMING_START() do { \ + if (this->phase() == TRAIN) { \ + this->timer.Start(); \ + } \ +}while(0) + +#define LAYER_TIMING_STOP(name, index) do { \ + if (this->phase() == TRAIN) { \ + this->name##_time_per_layer[index] += this->timer.MicroSeconds(); \ + } \ +}while(0) + +#define ITER_TIMING_START() do { \ + if (this->phase() == TRAIN) { \ + this->timer.Start(); \ + } \ +}while(0) + +#define ITER_TIMING_STOP(name) do { \ + if (this->phase() == TRAIN) { \ + this->name##_time_per_iter += this->timer.MicroSeconds(); \ + } \ +}while(0) + +#else + +#define LAYER_TIMING_START() +#define LAYER_TIMING_STOP(name,index) + +#define ITER_TIMING_START() +#define ITER_TIMING_STOP(name) + +#endif /* CAFFE_PER_LAYER_TIMINGS */ + + template Net::Net(const NetParameter& param, const Net* root_net) : root_net_(root_net) { @@ -478,6 +511,10 @@ void Net::Init(const NetParameter& in_param) { } #endif /* USE_MLSL */ +#ifdef CAFFE_PER_LAYER_TIMINGS + InitTimers(); +#endif + LOG_IF(INFO, Caffe::root_solver()) << "Network initialization done."; } @@ -1867,6 +1904,180 @@ const shared_ptr > 
Net::layer_by_name( return layer_ptr; } +#ifdef CAFFE_PER_LAYER_TIMINGS + +template +void Net::InitTimers() { + int layer_count = layers().size(); + + this->forward_time_per_layer.resize(layer_count, 0.0); + this->backward_time_per_layer.resize(layer_count, 0.0); + this->update_time_per_layer.resize(layer_count, 0.0); + this->cleardiffs_time_per_iter = 0.0; +#ifdef USE_MLSL + this->startcomm_time_per_layer.resize(layer_count, 0.0); + this->waitcomm_time_per_layer.resize(layer_count, 0.0); +#endif + this->forward_time_per_layer_total.resize(layer_count, 0.0); + this->backward_time_per_layer_total.resize(layer_count, 0.0); + this->update_time_per_layer_total.resize(layer_count, 0.0); + this->cleardiffs_time_per_iter_total = 0.0; +#ifdef USE_MLSL + this->startcomm_time_per_layer_total.resize(layer_count, 0.0); + this->waitcomm_time_per_layer_total.resize(layer_count, 0.0); +#endif +} + +template +void Net::ResetTimers() { + std::transform(this->forward_time_per_layer_total.begin(), + this->forward_time_per_layer_total.end(), + this->forward_time_per_layer.begin(), + this->forward_time_per_layer_total.begin(), + std::plus()); + + std::transform(this->backward_time_per_layer_total.begin(), + this->backward_time_per_layer_total.end(), + this->backward_time_per_layer.begin(), + this->backward_time_per_layer_total.begin(), + std::plus()); + + std::transform(this->update_time_per_layer_total.begin(), + this->update_time_per_layer_total.end(), + this->update_time_per_layer.begin(), + this->update_time_per_layer_total.begin(), + std::plus()); + this->cleardiffs_time_per_iter_total += this->cleardiffs_time_per_iter; +#ifdef USE_MLSL + std::transform(this->startcomm_time_per_layer_total.begin(), + this->startcomm_time_per_layer_total.end(), + this->startcomm_time_per_layer.begin(), + this->startcomm_time_per_layer_total.begin(), + std::plus()); + + std::transform(this->waitcomm_time_per_layer_total.begin(), + this->waitcomm_time_per_layer_total.end(), + 
this->waitcomm_time_per_layer.begin(), + this->waitcomm_time_per_layer_total.begin(), + std::plus()); +#endif + + std::fill(this->forward_time_per_layer.begin(), + this->forward_time_per_layer.end(), 0.0); + std::fill(this->backward_time_per_layer.begin(), + this->backward_time_per_layer.end(), 0.0); + std::fill(this->update_time_per_layer.begin(), + this->update_time_per_layer.end(), 0.0); + this->cleardiffs_time_per_iter = 0.0; +#ifdef USE_MLSL + std::fill(this->startcomm_time_per_layer.begin(), + this->startcomm_time_per_layer.end(), 0.0); + std::fill(this->waitcomm_time_per_layer.begin(), + this->waitcomm_time_per_layer.end(), 0.0); +#endif +} + +template +void Net::PrintTimers(bool printTotal) { +#ifdef USE_MLSL + if (mn::get_node_id() != 0) + return; +#endif + + LOG(WARNING) << std::endl; + LOG(WARNING) << "####################################################"; + + std::vector& forward_timers = printTotal ? + forward_time_per_layer_total : forward_time_per_layer; + std::vector& backward_timers = printTotal ? + backward_time_per_layer_total : backward_time_per_layer; + std::vector& update_timers = printTotal ? + update_time_per_layer_total : update_time_per_layer; + double cleardiffs_timer = printTotal ? + cleardiffs_time_per_iter_total : cleardiffs_time_per_iter; +#ifdef USE_MLSL + std::vector& startcomm_timers = printTotal ? + startcomm_time_per_layer_total : startcomm_time_per_layer; + std::vector& waitcomm_timers = printTotal ? + waitcomm_time_per_layer_total : waitcomm_time_per_layer; + std::string prefix = printTotal ? 
"TOTAL " : "DELTA "; +#endif + + double forward_time = std::accumulate(forward_timers.begin(), + forward_timers.end(), 0.0) / 1000.0; + LOG(WARNING) << prefix << "FORWARD TIME: " << forward_time << " ms"; + for (int layer_idx = 0; layer_idx < layers().size(); layer_idx++) { + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": forward_time: " << forward_timers[layer_idx] / 1000.0 + << " ms"; + } + LOG(WARNING) << std::endl; + + double backward_time = std::accumulate(backward_timers.begin(), + backward_timers.end(), 0.0) / 1000.0; + LOG(WARNING) << prefix << "BACKWARD TIME: " << backward_time << " ms"; + for (int layer_idx = 0; layer_idx < layers().size(); layer_idx++) { + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": backward_time: " << backward_timers[layer_idx] / 1000.0 + << " ms"; + } + LOG(WARNING) << std::endl; + + double update_time = std::accumulate(update_timers.begin(), + update_timers.end(), 0.0) / 1000.0; + LOG(WARNING) << prefix << "UPDATE TIME: " << update_time << " ms"; + for (int layer_idx = 0; layer_idx < layers().size(); layer_idx++) { + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": update_time: " << update_timers[layer_idx] / 1000.0 + << " ms"; + } + LOG(WARNING) << std::endl; + + double cleardiffs_time = cleardiffs_timer / 1000.0; + LOG(WARNING) << prefix << "CLEAR PARAMETER DIFFS TIME: " << cleardiffs_time << " ms"; + LOG(WARNING) << std::endl; + +#ifdef USE_MLSL + double startcomm_time = std::accumulate(startcomm_timers.begin(), + startcomm_timers.end(), 0.0) / 1000.0; + LOG(WARNING) << prefix << "START COMMUNICATION TIME: " << startcomm_time << " ms"; + for (int layer_idx = 0; layer_idx < layers().size(); layer_idx++) { + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": startcomm_time: " << startcomm_timers[layer_idx] / 1000.0 + << " ms"; + } + LOG(WARNING) << std::endl; + + double waitcomm_time 
= std::accumulate(waitcomm_timers.begin(), + waitcomm_timers.end(), 0.0) / 1000.0; + LOG(WARNING) << prefix << "WAIT COMMUNICATION TIME: " << waitcomm_time << " ms"; + for (int layer_idx = 0; layer_idx < layers().size(); layer_idx++) { + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": waitcomm_time: " << waitcomm_timers[layer_idx] / 1000.0 + << " ms"; + } + LOG(WARNING) << std::endl; + + LOG(WARNING) << prefix << "TIME (Computation + Communication): " << (forward_time + + backward_time + update_time + cleardiffs_time + startcomm_time + waitcomm_time) / 1000.0 + << " sec"; +#else + LOG(WARNING) << prefix << "TIME (Computation): " << (forward_time + + backward_time + update_time + cleardiffs_time) / 1000.0 << " sec"; +#endif + + LOG(WARNING) << "####################################################"; + LOG(WARNING) << std::endl; +} + +#endif /* CAFFE_PER_LAYER_TIMINGS */ + + INSTANTIATE_CLASS(Net); } // namespace caffe diff --git a/src/caffe/solver.cpp b/src/caffe/solver.cpp index f566ce935..579bde991 100644 --- a/src/caffe/solver.cpp +++ b/src/caffe/solver.cpp @@ -122,11 +122,6 @@ void Solver::Init(const SolverParameter& param) { } iter_ = 0; current_step_ = 0; - -#ifdef CAFFE_PER_LAYER_TIMINGS - InitTimers(); - net_->set_root_solver(this); -#endif } template @@ -357,8 +352,8 @@ void Solver::Step(int iters) { iter_time += iter_timer.MilliSeconds(); #ifdef CAFFE_PER_LAYER_TIMINGS - PrintTimers(false); - ResetTimers(); + net_->PrintTimers(false); + net_->ResetTimers(); if (mn::get_node_id() == 0) LOG(INFO) << "iter " << iter_ << ", forward_backward_update_time: " @@ -386,184 +381,11 @@ void Solver::Step(int iters) { } #ifdef CAFFE_PER_LAYER_TIMINGS - ResetTimers(); - PrintTimers(true); -#endif -} - -#ifdef CAFFE_PER_LAYER_TIMINGS - -template -void Solver::InitTimers() { - int layer_count = net_->layers().size(); - - this->forward_time_per_layer.resize(layer_count, 0.0); - this->backward_time_per_layer.resize(layer_count, 0.0); - 
this->update_time_per_layer.resize(layer_count, 0.0); - this->cleardiffs_time_per_iter = 0.0; -#ifdef USE_MLSL - this->startcomm_time_per_layer.resize(layer_count, 0.0); - this->waitcomm_time_per_layer.resize(layer_count, 0.0); -#endif - this->forward_time_per_layer_total.resize(layer_count, 0.0); - this->backward_time_per_layer_total.resize(layer_count, 0.0); - this->update_time_per_layer_total.resize(layer_count, 0.0); - this->cleardiffs_time_per_iter_total = 0.0; -#ifdef USE_MLSL - this->startcomm_time_per_layer_total.resize(layer_count, 0.0); - this->waitcomm_time_per_layer_total.resize(layer_count, 0.0); -#endif -} - -template -void Solver::ResetTimers() { - std::transform(this->forward_time_per_layer_total.begin(), - this->forward_time_per_layer_total.end(), - this->forward_time_per_layer.begin(), - this->forward_time_per_layer_total.begin(), - std::plus()); - - std::transform(this->backward_time_per_layer_total.begin(), - this->backward_time_per_layer_total.end(), - this->backward_time_per_layer.begin(), - this->backward_time_per_layer_total.begin(), - std::plus()); - - std::transform(this->update_time_per_layer_total.begin(), - this->update_time_per_layer_total.end(), - this->update_time_per_layer.begin(), - this->update_time_per_layer_total.begin(), - std::plus()); - this->cleardiffs_time_per_iter_total += this->cleardiffs_time_per_iter; -#ifdef USE_MLSL - std::transform(this->startcomm_time_per_layer_total.begin(), - this->startcomm_time_per_layer_total.end(), - this->startcomm_time_per_layer.begin(), - this->startcomm_time_per_layer_total.begin(), - std::plus()); - - std::transform(this->waitcomm_time_per_layer_total.begin(), - this->waitcomm_time_per_layer_total.end(), - this->waitcomm_time_per_layer.begin(), - this->waitcomm_time_per_layer_total.begin(), - std::plus()); -#endif - - std::fill(this->forward_time_per_layer.begin(), - this->forward_time_per_layer.end(), 0.0); - std::fill(this->backward_time_per_layer.begin(), - 
this->backward_time_per_layer.end(), 0.0); - std::fill(this->update_time_per_layer.begin(), - this->update_time_per_layer.end(), 0.0); - this->cleardiffs_time_per_iter = 0.0; -#ifdef USE_MLSL - std::fill(this->startcomm_time_per_layer.begin(), - this->startcomm_time_per_layer.end(), 0.0); - std::fill(this->waitcomm_time_per_layer.begin(), - this->waitcomm_time_per_layer.end(), 0.0); + net_->ResetTimers(); + net_->PrintTimers(true); #endif } -template -void Solver::PrintTimers(bool printTotal) { -#ifdef USE_MLSL - if (mn::get_node_id() != 0) - return; -#endif - - LOG(WARNING) << std::endl; - LOG(WARNING) << "####################################################"; - - std::vector& forward_timers = printTotal ? - forward_time_per_layer_total : forward_time_per_layer; - std::vector& backward_timers = printTotal ? - backward_time_per_layer_total : backward_time_per_layer; - std::vector& update_timers = printTotal ? - update_time_per_layer_total : update_time_per_layer; - double cleardiffs_timer = printTotal ? - cleardiffs_time_per_iter_total : cleardiffs_time_per_iter; -#ifdef USE_MLSL - std::vector& startcomm_timers = printTotal ? - startcomm_time_per_layer_total : startcomm_time_per_layer; - std::vector& waitcomm_timers = printTotal ? - waitcomm_time_per_layer_total : waitcomm_time_per_layer; - std::string prefix = printTotal ? 
"TOTAL " : "DELTA "; -#endif - - double forward_time = std::accumulate(forward_timers.begin(), - forward_timers.end(), 0.0) / 1000.0; - LOG(WARNING) << prefix << "FORWARD TIME: " << forward_time << " ms"; - for (int layer_idx = 0; layer_idx < net_->layers().size(); layer_idx++) { - LOG(WARNING) << "LAYER-" << layer_idx << " " - << net_->layers()[layer_idx]->type() - << ": forward_time: " << forward_timers[layer_idx] / 1000.0 - << " ms"; - } - LOG(WARNING) << std::endl; - - double backward_time = std::accumulate(backward_timers.begin(), - backward_timers.end(), 0.0) / 1000.0; - LOG(WARNING) << prefix << "BACKWARD TIME: " << backward_time << " ms"; - for (int layer_idx = 0; layer_idx < net_->layers().size(); layer_idx++) { - LOG(WARNING) << "LAYER-" << layer_idx << " " - << net_->layers()[layer_idx]->type() - << ": backward_time: " << backward_timers[layer_idx] / 1000.0 - << " ms"; - } - LOG(WARNING) << std::endl; - - double update_time = std::accumulate(update_timers.begin(), - update_timers.end(), 0.0) / 1000.0; - LOG(WARNING) << prefix << "UPDATE TIME: " << update_time << " ms"; - for (int layer_idx = 0; layer_idx < net_->layers().size(); layer_idx++) { - LOG(WARNING) << "LAYER-" << layer_idx << " " - << net_->layers()[layer_idx]->type() - << ": update_time: " << update_timers[layer_idx] / 1000.0 - << " ms"; - } - LOG(WARNING) << std::endl; - - double cleardiffs_time = cleardiffs_timer / 1000.0; - LOG(WARNING) << prefix << "CLEAR PARAMETER DIFFS TIME: " << cleardiffs_time << " ms"; - LOG(WARNING) << std::endl; - -#ifdef USE_MLSL - double startcomm_time = std::accumulate(startcomm_timers.begin(), - startcomm_timers.end(), 0.0) / 1000.0; - LOG(WARNING) << prefix << "START COMMUNICATION TIME: " << startcomm_time << " ms"; - for (int layer_idx = 0; layer_idx < net_->layers().size(); layer_idx++) { - LOG(WARNING) << "LAYER-" << layer_idx << " " - << net_->layers()[layer_idx]->type() - << ": startcomm_time: " << startcomm_timers[layer_idx] / 1000.0 - << " ms"; - } - 
LOG(WARNING) << std::endl; - - double waitcomm_time = std::accumulate(waitcomm_timers.begin(), - waitcomm_timers.end(), 0.0) / 1000.0; - LOG(WARNING) << prefix << "WAIT COMMUNICATION TIME: " << waitcomm_time << " ms"; - for (int layer_idx = 0; layer_idx < net_->layers().size(); layer_idx++) { - LOG(WARNING) << "LAYER-" << layer_idx << " " - << net_->layers()[layer_idx]->type() - << ": waitcomm_time: " << waitcomm_timers[layer_idx] / 1000.0 - << " ms"; - } - LOG(WARNING) << std::endl; - - LOG(WARNING) << prefix << "TIME (Computation + Communication): " << (forward_time + - backward_time + update_time + cleardiffs_time + startcomm_time + waitcomm_time) / 1000.0 - << " sec"; -#else - LOG(WARNING) << prefix << "TIME (Computation): " << (forward_time + - backward_time + update_time + cleardiffs_time) / 1000.0 << " sec"; -#endif - - LOG(WARNING) << "####################################################"; - LOG(WARNING) << std::endl; -} - -#endif /* CAFFE_PER_LAYER_TIMINGS */ - template void Solver::Solve(const char* resume_file) { CHECK(Caffe::root_solver()); diff --git a/src/caffe/solvers/sgd_solver.cpp b/src/caffe/solvers/sgd_solver.cpp index dbd916dd9..37b52ea99 100644 --- a/src/caffe/solvers/sgd_solver.cpp +++ b/src/caffe/solvers/sgd_solver.cpp @@ -49,11 +49,15 @@ namespace caffe { #ifdef CAFFE_PER_LAYER_TIMINGS #define LAYER_UPDATE_TIMING_START() do { \ - this->timer.Start(); \ + if (this->net_->phase() == TRAIN) { \ + this->net_->timer.Start(); \ + } \ }while(0) #define LAYER_UPDATE_TIMING_STOP(index) do { \ - this->update_time_per_layer[index] += this->timer.MicroSeconds(); \ + if (this->net_->phase() == TRAIN) { \ + this->net_->update_time_per_layer[index] += this->net_->timer.MicroSeconds(); \ + } \ }while(0) #else From d1c6d38d7cd906d85328c41dad99f487925c0daf Mon Sep 17 00:00:00 2001 From: fzou1 Date: Tue, 12 Dec 2017 15:23:16 +0800 Subject: [PATCH 09/53] support engine, caffe_bin, data_source in OOB scripts; and fix issue of finding data source also fix an 
issue of sorting ip address (ICL-345) Change-Id: I103c4e0f06b9473f84c3f9a297bf81ce40438500 --- scripts/build_intelcaffe.sh | 4 +++ scripts/run_benchmark.sh | 51 ++++++++++++++++++++++++++++++++----- scripts/run_intelcaffe.sh | 33 +++++++++++++++++------- 3 files changed, 73 insertions(+), 15 deletions(-) diff --git a/scripts/build_intelcaffe.sh b/scripts/build_intelcaffe.sh index d9bddaeca..168d04fc3 100755 --- a/scripts/build_intelcaffe.sh +++ b/scripts/build_intelcaffe.sh @@ -55,6 +55,10 @@ function build_caffe_gcc echo "DEBUG := 1" >> Makefile.config fi + if [ "$boost_root" != "" ]; then + echo "BOOST_ROOT := $boost_root" >> Makefile.config + fi + if [ $is_rebuild -eq 1 ]; then make clean fi diff --git a/scripts/run_benchmark.sh b/scripts/run_benchmark.sh index d73cf9987..c03fe50c3 100755 --- a/scripts/run_benchmark.sh +++ b/scripts/run_benchmark.sh @@ -16,7 +16,7 @@ cpu_model="skx" unknown_cpu=0 # specify default engine for running caffe benchmarks -engine="MKLDNN" +engine="" # default support single node numnodes=1 @@ -25,7 +25,10 @@ numnodes=1 intelcaffe_log_file="" # specific script used to run intelcaffe -caffe_bin="./scripts/run_intelcaffe.sh" +caffe_run_script="./scripts/run_intelcaffe.sh" + +# path of caffe binary +caffe_bin="" # iterations to run benchmark iterations=100 @@ -37,11 +40,15 @@ host_file="" network="opa" tcp_netmask="" + +data_source="dummy" + function usage { script_name=$0 echo "Usage:" echo " $script_name --topology network_topology [--hostfile host_file] [--network opa/tcp] [--netmask tcp_netmask]" + echo " [--data_source lmdb/dummy] [--caffe_bin caffe_bin_path] [--engine engine]" echo "" echo " Parameters:" echo " topology: network topology used to benchmark, support alexnet, googlenet, googlenet_v2, resnet_50" @@ -49,6 +56,10 @@ function usage echo " hostfile: host_file needed in multinodes mode, should contain list of nodes ips or hostnames" echo " network: opa(default), tcp, used in multinodes mode to specify the network type" echo 
" netmask: only used if network is tcp, set as the net work card name within your network" + echo " data_source: dummy(default), lmdb. data source for neural network." + echo " caffe_bin_path: specify path of caffe binary." + echo " engine: empty value(default), MKL2017 and MKLDNN. Default empty value" + echo " is to use default engine in Intel Caffe." echo "" } @@ -99,15 +110,31 @@ function detect_cpu function run_specific_model { if [ $numnodes -eq 1 ]; then - model_file="models/intel_optimized_models/${model}/${cpu_model}/train_val_dummydata.prototxt" - exec_command="${caffe_bin} --model_file ${model_file} --mode time --iteration ${iterations} --benchmark none" + if [ "$data_source" == "dummy" ]; then + model_file="models/intel_optimized_models/${model}/${cpu_model}/train_val_dummydata.prototxt" + else + model_file="models/intel_optimized_models/${model}/${cpu_model}/train_val.prototxt" + fi + exec_command="${caffe_run_script} --model_file ${model_file} --mode time --iteration ${iterations} --benchmark none" else - solver_file="models/intel_optimized_models/${model}/${cpu_model}/solver_dummydata.prototxt" - exec_command="${caffe_bin} --hostfile $host_file --solver $solver_file --network $network --benchmark none" + if [ "$data_source" == "dummy" ]; then + solver_file="models/intel_optimized_models/${model}/${cpu_model}/solver_dummydata.prototxt" + else + solver_file="models/intel_optimized_models/${model}/${cpu_model}/solver.prototxt" + fi + + exec_command="${caffe_run_script} --hostfile $host_file --solver $solver_file --network $network --benchmark none" if [ $network == "tcp" ]; then exec_command+=" --netmask $tcp_netmask" fi fi + + if [ "$engine" != "" ]; then + exec_command+=" --engine $engine" + fi + if [ "$caffe_bin" != "" ]; then + exec_command+=" --caffe_bin $caffe_bin" + fi # Result file to save detailed run intelcaffe results if [ $unknown_cpu -eq 0 ]; then @@ -267,6 +294,18 @@ do tcp_netmask="$2" shift ;; + --engine) + engine="$2" + shift + ;; + 
--data_source) + data_source="$2" + shift + ;; + --caffe_bin) + caffe_bin=$2 + shift + ;; *) echo "Unknown option: $key" usage diff --git a/scripts/run_intelcaffe.sh b/scripts/run_intelcaffe.sh index d5c2f6838..27e90cef7 100755 --- a/scripts/run_intelcaffe.sh +++ b/scripts/run_intelcaffe.sh @@ -54,6 +54,8 @@ mpibench_param="allreduce" script_dir=$(dirname $0) +caffe_bin="" + function usage { script_name=$0 @@ -69,6 +71,7 @@ function usage echo " [--output output_folder]" echo " [--mpibench_bin mpibench_bin]" echo " [--mpibench_param mpibench_param]" + echo " [--caffe_bin caffe_binary_path]" echo "" echo " Parameters:" echo " hostfile: host file includes list of nodes. Only used if you're running with multinode" @@ -89,6 +92,8 @@ function usage echo " output_folder: output folder for storing results" echo " mpibench_bin: IMB-MPI1 (default). relative path of binary of mpi benchmark." echo " mpibench_param: allreduce (default). parameter of mpi benchmark." + echo " caffe_binary_path: path of caffe binary." 
+ echo "" } declare -a cpu_list=("Intel Xeon E5-26xx (Broadwell)" "Intel Xeon Phi 72xx (Knights Landing)" @@ -335,7 +340,7 @@ function test_ssh_connection { host_file_=$1 if [ "$host_file_" != "" ]; then - host_list=( `cat $host_file_ | sort | uniq ` ) + host_list=( `cat $host_file_ | sort -V | uniq ` ) for host in ${host_list[@]} do hostname=`ssh $host "hostname"` @@ -349,7 +354,7 @@ function test_ssh_connection function get_model_fname { solver_file_=$1 - model_file_=$(grep -w "net:" $solver_file_ | head -n 1 | awk -F ':' '{print $2}' | sed 's/\"//g') + model_file_=$(grep -w "net:" $solver_file_ | head -n 1 | awk -F ':' '{print $2}' | sed 's/\"//g' | sed 's/\r//g') echo "$(echo $model_file_)" } @@ -357,14 +362,13 @@ function check_lmdb_files { model_file_=$1 - lmdb_dirs=(ilsvrc12_train_lmdb ilsvrc12_val_lmdb) is_missing_lmdb=0 + lmdb_dirs=($(grep -w "source:" $model_file_ | sed 's/^ *//g' | grep -v "^#" | awk -F ' ' '{print $(NF)}' | sed 's/\"//g' | sed 's/\r//g')) for lmdb_dir in "${lmdb_dirs[@]}" do - data_source_dir=$(grep -w "$lmdb_dir" $model_file_ | head -n 1 | awk -F ' ' '{print $(NF)}' | sed 's/\"//g') - echo " LMDB data source: $data_source_dir" - if [ ! -d $data_source_dir ]; then - echo "Error: LMDB data source doesn't exist ($data_source_dir)." + echo " LMDB data source: $lmdb_dir" + if [ ! -d "$lmdb_dir" ]; then + echo "Error: LMDB data source doesn't exist ($lmdb_dir)." let is_missing_lmdb=1 fi done @@ -475,6 +479,14 @@ do --help) usage ;; + --engine) + engine=$2 + shift + ;; + --caffe_bin) + caffe_bin=$2 + shift + ;; *) echo "Unknown option: $key" usage @@ -565,7 +577,7 @@ fi # Names to configfile, binary (executable) files # # Add check for host_file's existence to support single node if [[ $host_file != "" ]]; then - nodenames=( `cat $host_file | sort | uniq ` ) + nodenames=( `cat $host_file | sort -V | uniq ` ) if [ ${#nodenames[@]} -eq 0 ]; then echo "Error: empty host file! Exit." 
exit 0 @@ -601,7 +613,10 @@ if [ "${benchmark_mode}" != "none" ]; then fi if [ "${mode}" != "none" ]; then - caffe_bin="./build/tools/caffe" + if [ "$caffe_bin" == "" ]; then + caffe_bin="${root_dir}/build/tools/caffe" + fi + check_dependency $caffe_bin if [ $? -ne 0 ]; then echo "Exit." From ea1a4d966733f4b2b989fdbb792ce2554b47cbf5 Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Thu, 14 Dec 2017 12:52:55 +0800 Subject: [PATCH 10/53] Fix for issue ICL-351 by adding the engine checker for conv/sum fusion. --- src/caffe/net.cpp | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index a5c037668..b8169f78e 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -888,7 +888,7 @@ template void Net::CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled) { // only apply this rule for inference(TEST) phase - if (param.state().phase() != TEST) { + if (param.state().phase() != TEST || param.engine().compare("MKLDNN") != 0) { param_compiled->CopyFrom(param); return; } @@ -897,7 +897,10 @@ void Net::CompilationRuleFour(const NetParameter& param, for (int i = 0; i < param.layer_size(); i++) { LayerParameter* layer_param = (const_cast(param)).mutable_layer(i); - if (layer_param->type().compare("Convolution") == 0) { + if (layer_param->type().compare("Convolution") == 0 + && (layer_param->has_engine() == false + || (layer_param->has_engine() == true + && layer_param->engine().compare("MKLDNN") ==0))) { std::vector child_layers_params; Net::GetBlobConsumers(child_layers_params, layer_param->top(0), param, From ae3793c9bdbefcf1a8202dc7bfd824a9d6445f15 Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Thu, 14 Dec 2017 22:36:54 +0800 Subject: [PATCH 11/53] Remove the deprecated conv/relu fusion api. 
--- src/caffe/layers/mkldnn_convolution_layer.cpp | 1 - 1 file changed, 1 deletion(-) diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index ab0ec7617..1ac34b5fb 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -204,7 +204,6 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* subengines = "MKLDNN:CPU"; EngineParser ep(subengines); unsigned subEngineIndex = 0; - shared_ptr convReluFwd_pd = NULL; mkldnn::algorithm eligibleAlgorithms[2] = {conv_algorithm, algorithm::convolution_direct}; convFwd_pd = NULL; mkldnn::primitive_attr attr; From 097e8485367374dbe5f9047a891ddacd91d1e0e8 Mon Sep 17 00:00:00 2001 From: "Yu, Chong" Date: Mon, 18 Dec 2017 01:22:55 +0800 Subject: [PATCH 12/53] Update MKLDNN version to 82cf37f626. --- mkldnn.commit | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mkldnn.commit b/mkldnn.commit index f28f6c194..ed29e5f9d 100644 --- a/mkldnn.commit +++ b/mkldnn.commit @@ -1 +1 @@ -aab753280e83137ba955f8f19d72cb6aaba545ef +82cf37f626a0998d38f99c30e5a08a0dd5e49bc0 \ No newline at end of file From 9e89fa3b695343bd5c9842f19723903c162a2a16 Mon Sep 17 00:00:00 2001 From: "Tian, Feng" Date: Tue, 19 Dec 2017 08:42:42 +0800 Subject: [PATCH 13/53] Fix shape and prv format mismatch issue in Reshape/Flatten layer as they change the shape but bottom prv is directly shared to top prv. It will cause MKLDNN primitive creation assertion. --- src/caffe/blob.cpp | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/caffe/blob.cpp b/src/caffe/blob.cpp index 4a2beb8eb..627735ee2 100644 --- a/src/caffe/blob.cpp +++ b/src/caffe/blob.cpp @@ -245,12 +245,18 @@ shared_ptr Blob::get_prv_diff_descriptor() { template void Blob::ShareData(const Blob& other) { CHECK_EQ(count_, other.count()); + // Although the count is same, we have to forcedly sync data to cpu if shape is changed. 
+ // This is used to avoid mismatch between cpu shape and prv data. + if(this->shape() != other.shape() && other.data()) other.data()->mutable_cpu_data(); data_ = other.data(); } template void Blob::ShareDiff(const Blob& other) { CHECK_EQ(count_, other.count()); + // Although the count is same, we have to forcedly sync data to cpu if shape is changed. + // This is used to avoid mismatch between cpu shape and prv data. + if(this->shape() != other.shape() && other.diff()) other.diff()->mutable_cpu_data(); diff_ = other.diff(); } From 356f1b59d312c114ca5290d8e9923beb37af0513 Mon Sep 17 00:00:00 2001 From: fzou1 Date: Fri, 15 Dec 2017 14:59:20 +0800 Subject: [PATCH 14/53] add timeline for multinode and print payload size Change-Id: I3f916afc590c45ad96167aa40e53aa9f7f1a3d68 --- include/caffe/multinode/multi_solver.hpp | 2 +- include/caffe/net.hpp | 25 ++- include/caffe/util/benchmark.hpp | 7 + src/caffe/multinode/multi_solver.cpp | 95 ++++++------ src/caffe/net.cpp | 186 +++++++++++++++++++++-- src/caffe/solver.cpp | 3 + src/caffe/solvers/sgd_solver.cpp | 15 +- src/caffe/util/benchmark.cpp | 14 ++ 8 files changed, 279 insertions(+), 68 deletions(-) diff --git a/include/caffe/multinode/multi_solver.hpp b/include/caffe/multinode/multi_solver.hpp index 5c4452aa6..bebab3c6c 100644 --- a/include/caffe/multinode/multi_solver.hpp +++ b/include/caffe/multinode/multi_solver.hpp @@ -111,7 +111,7 @@ class MultiSolver { #endif private: virtual Dtype ForwardBackwardImpl(bool first, bool last); - bool IsSkipWaitGradient(int layer_id); + bool IsSkipSyncGradient(int layer_id); bool WaitGradient(int layer_id); void UpdateGradient(int layer_id); diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index ad1411bc2..3359ac813 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -356,6 +356,19 @@ class Net { #ifdef USE_MLSL std::vector startcomm_time_per_layer; std::vector waitcomm_time_per_layer; + + std::vector startcomm_start_time_per_layer; + std::vector 
waitcomm_start_time_per_layer; + std::vector startcomm_stop_time_per_layer; + std::vector waitcomm_stop_time_per_layer; + +#ifdef FW_OVERLAP_OPT + std::vector first_waitcomm_start_time_per_layer; + std::vector first_waitcomm_stop_time_per_layer; + std::vector first_update_start_time_per_layer; + std::vector first_update_stop_time_per_layer; +#endif + #endif std::vector forward_time_per_layer_total; @@ -367,12 +380,22 @@ class Net { std::vector waitcomm_time_per_layer_total; #endif + std::vector forward_start_time_per_layer; + std::vector backward_start_time_per_layer; + std::vector update_start_time_per_layer; + + std::vector forward_stop_time_per_layer; + std::vector backward_stop_time_per_layer; + std::vector update_stop_time_per_layer; + void InitTimers(); void ResetTimers(); void PrintTimers(bool printTotal); -#endif /* CAFFE_PER_LAYER_TIMINGS */ + void PrintPayloadSize(); + void SaveTimeline(); +#endif /* CAFFE_PER_LAYER_TIMINGS */ protected: // Helpers for Init. diff --git a/include/caffe/util/benchmark.hpp b/include/caffe/util/benchmark.hpp index cc0041643..fa7e36663 100644 --- a/include/caffe/util/benchmark.hpp +++ b/include/caffe/util/benchmark.hpp @@ -54,6 +54,10 @@ class Timer { virtual float MicroSeconds(); virtual float Seconds(); + virtual void InitTime(); + virtual void InitTime(Timer &); + virtual float Duration(); + inline bool initted() { return initted_; } inline bool running() { return running_; } inline bool has_run_at_least_once() { return has_run_at_least_once_; } @@ -68,6 +72,9 @@ class Timer { cudaEvent_t start_gpu_; cudaEvent_t stop_gpu_; #endif + + boost::posix_time::ptime init_cpu_; + boost::posix_time::ptime start_cpu_; boost::posix_time::ptime stop_cpu_; float elapsed_milliseconds_; diff --git a/src/caffe/multinode/multi_solver.cpp b/src/caffe/multinode/multi_solver.cpp index a4bdbbe90..686e076eb 100644 --- a/src/caffe/multinode/multi_solver.cpp +++ b/src/caffe/multinode/multi_solver.cpp @@ -43,33 +43,38 @@ OF THIS SOFTWARE, EVEN IF 
ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include #include "caffe/multinode/multi_solver.hpp" +#include "caffe/util/performance.hpp" namespace caffe { #ifdef CAFFE_PER_LAYER_TIMINGS -#define LAYER_TIMING_START() do { \ +#define LAYER_TIMING_START(name, index) do { \ if (root_solver_->net()->phase() == TRAIN) { \ - root_solver_->net()->timer.Start(); \ + root_solver_->net()->name##_start_time_per_layer[index] = root_solver_->net()->timer.Duration(); \ } \ }while(0) -#define LAYER_TIMING_STOP(name, index) do { \ +#define LAYER_TIMING_STOP_2(layer_time_name, name, index) do { \ if (root_solver_->net()->phase() == TRAIN) { \ - root_solver_->net()->name##_time_per_layer[index] += root_solver_->net()->timer.MicroSeconds(); \ + root_solver_->net()->name##_stop_time_per_layer[index] = root_solver_->net()->timer.Duration(); \ + root_solver_->net()->layer_time_name##_time_per_layer[index] += (root_solver_->net()->name##_stop_time_per_layer[index] - root_solver_->net()->name##_start_time_per_layer[index]); \ } \ }while(0) +#define LAYER_TIMING_STOP(name, index) LAYER_TIMING_STOP_2(name,name,index) + #ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() do { \ +#define LAYER_WAIT_TIMING_START(index) do { \ if (root_solver_->net()->phase() == TRAIN) { \ - root_solver_->net()->wait_timer.Start(); \ + root_solver_->net()->first_waitcomm_start_time_per_layer[index] = root_solver_->net()->wait_timer.Duration(); \ } \ }while(0) -#define LAYER_WAIT_TIMING_STOP(layer_index) do { \ +#define LAYER_WAIT_TIMING_STOP(index) do { \ if (root_solver_->net()->phase() == TRAIN) { \ - root_solver_->net()->waitcomm_time_per_layer[layer_index] += root_solver_->net()->wait_timer.MicroSeconds(); \ + root_solver_->net()->first_waitcomm_stop_time_per_layer[index] = root_solver_->net()->wait_timer.Duration(); \ + root_solver_->net()->waitcomm_time_per_layer[index] += (root_solver_->net()->first_waitcomm_stop_time_per_layer[index] - root_solver_->net()->first_waitcomm_start_time_per_layer[index]); 
\ } \ }while(0) @@ -82,11 +87,12 @@ namespace caffe { #else -#define LAYER_TIMING_START() -#define LAYER_TIMING_STOP(name,index) +#define LAYER_TIMING_START(name, index) +#define LAYER_TIMING_STOP(name, index) +#define LAYER_TIMING_STOP_2(layer_time_name, name,index) #ifdef FW_OVERLAP_OPT -#define LAYER_WAIT_TIMING_START() +#define LAYER_WAIT_TIMING_START(index) #define LAYER_WAIT_TIMING_STOP(index) #define LAYER_REMOVE_UPDATE_TIME(layer_i, layer_k) #endif @@ -95,15 +101,14 @@ namespace caffe { template -inline bool MultiSolver::IsSkipWaitGradient(int layer_id) { +inline bool MultiSolver::IsSkipSyncGradient(int layer_id) { Net& net = *root_solver_->net(); const std::vector>>& layers{ net.layers() }; const std::vector& layer_need_backward{ net.layer_need_backward() }; if (!layer_need_backward[layer_id] || ((layers[layer_id]->layerOp != nullptr) && !layers[layer_id]->layerOp->HasParameterSets())) { - DLOG(INFO) << "ForwardBackwardImpl: no need for apply_updates for layer # " - << layer_id << ", skip on_delwt_wait, apply_updates, on_wtinc_ready"; + DLOG(INFO) << "No need for synchronizing gradients for layer # " << layer_id; return true; } return false; @@ -111,36 +116,27 @@ inline bool MultiSolver::IsSkipWaitGradient(int layer_id) { template inline bool MultiSolver::WaitGradient(int layer_id) { -#ifndef FW_OVERLAP_OPT - LAYER_TIMING_START(); -#endif for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->on_delwt_wait(layer_id); } -#ifndef FW_OVERLAP_OPT - LAYER_TIMING_STOP(waitcomm, layer_id); - return true; -#else +#ifdef FW_OVERLAP_OPT return layer_finished_flags_[layer_id]; +#else + return true; #endif } template inline void MultiSolver::UpdateGradient(int layer_id) { #ifdef FW_OVERLAP_OPT - if (layer_finished_flags_[layer_id]) { + CHECK(layer_finished_flags_[layer_id]); #endif - - LAYER_TIMING_START(); + PERFORMANCE_MEASUREMENT_BEGIN(); for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->apply_updates(layer_id); } - LAYER_TIMING_STOP(update, 
layer_id); - -#ifdef FW_OVERLAP_OPT - } -#endif + PERFORMANCE_MEASUREMENT_END_STATIC("weights_update"); } template @@ -153,30 +149,35 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, bool last) { for (int i = 0; i < layers.size(); ++i) { #ifdef FW_OVERLAP_OPT if (first) { - LAYER_WAIT_TIMING_START(); + LAYER_WAIT_TIMING_START(i); while (layer_finished_flags_[i] == false) { - if (IsSkipWaitGradient(i)) - break; - + if (IsSkipSyncGradient(i)) + break; if (WaitGradient(i)) { // The function call cannot be moved out of while loop. Otherwise, // at first iteration, additional UpdateGradient will be called, // even if no gradient is synced. + LAYER_TIMING_START(first_update, i); UpdateGradient(i); + LAYER_TIMING_STOP_2(update, first_update, i); + // The update time for layer i must be removed from waitcomm time // for layer i LAYER_REMOVE_UPDATE_TIME(i, i); break; } - + // wait and update gradient for next layers for (int k=i+1; k::ForwardBackwardImpl(bool first, bool last) { } } } - LAYER_WAIT_TIMING_STOP(i); // set flag to false after updating gradient layer_finished_flags_[i] = false; @@ -193,7 +193,7 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, bool last) { loss += net.ForwardFromTo(i, i); } - + // Clear parameter diffs after communication is finished (that is, after // calling WaitGradientComm) if (first) { @@ -207,18 +207,15 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, bool last) { net.BackwardFromTo(i, i); - if (last && (layers[i]->layerOp != nullptr) - && layers[i]->layerOp->HasParameterSets()) { - - LAYER_TIMING_START(); + LAYER_TIMING_START(startcomm, i); + if (last && IsSkipSyncGradient(i) == false) { for (int j = 0; j < callbacks_.size(); ++j) { callbacks_[j]->on_backward_finished(i); } - LAYER_TIMING_STOP(startcomm, i); } + LAYER_TIMING_STOP(startcomm, i); } - #ifdef FW_OVERLAP_OPT int iter = root_solver_->iter(); int max_iter = root_solver_->param().max_iter(); @@ -231,11 +228,13 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, 
bool last) { if (last_iter_wait_flag) { for (int i = 0; i < layers.size(); ++i) { - if (IsSkipWaitGradient(i)) + LAYER_TIMING_START(waitcomm, i); + if (IsSkipSyncGradient(i)) { + LAYER_TIMING_STOP(waitcomm, i); continue; + } #ifdef FW_OVERLAP_OPT - LAYER_WAIT_TIMING_START(); while ( #endif WaitGradient(i) @@ -243,11 +242,11 @@ Dtype MultiSolver::ForwardBackwardImpl(bool first, bool last) { == false) #endif ; + LAYER_TIMING_STOP(waitcomm, i); -#ifdef FW_OVERLAP_OPT - LAYER_WAIT_TIMING_STOP(i); -#endif + LAYER_TIMING_START(update, i); UpdateGradient(i); + LAYER_TIMING_STOP(update, i); } } diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index b8169f78e..74040f1c1 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -64,24 +64,27 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "caffe/util/remove_batch_norm.hpp" #include "caffe/util/apply_bn_stats_batch_size.hpp" + PERFORMANCE_CREATE_MONITOR(); namespace caffe { #ifdef CAFFE_PER_LAYER_TIMINGS -#define LAYER_TIMING_START() do { \ +#define LAYER_TIMING_START(name, index) do { \ if (this->phase() == TRAIN) { \ - this->timer.Start(); \ + this->name##_start_time_per_layer[index] = this->timer.Duration(); \ } \ }while(0) #define LAYER_TIMING_STOP(name, index) do { \ if (this->phase() == TRAIN) { \ - this->name##_time_per_layer[index] += this->timer.MicroSeconds(); \ + this->name##_stop_time_per_layer[index] = this->timer.Duration(); \ + this->name##_time_per_layer[index] += (this->name##_stop_time_per_layer[index] - this->name##_start_time_per_layer[index]); \ } \ }while(0) + #define ITER_TIMING_START() do { \ if (this->phase() == TRAIN) { \ this->timer.Start(); \ @@ -96,7 +99,7 @@ namespace caffe { #else -#define LAYER_TIMING_START() +#define LAYER_TIMING_START(name,index) #define LAYER_TIMING_STOP(name,index) #define ITER_TIMING_START() @@ -1274,7 +1277,7 @@ Dtype Net::ForwardFromTo(int start, int end) { CHECK_LT(end, layers_.size()); Dtype loss = 0; for (int i = start; i <= end; 
++i) { - LAYER_TIMING_START(); + LAYER_TIMING_START(forward, i); PERFORMANCE_MEASUREMENT_BEGIN(); // LOG(ERROR) << "Forwarding " << layer_names_[i]; @@ -1327,7 +1330,8 @@ void Net::BackwardFromTo(int start, int end) { CHECK_LT(start, layers_.size()); for (int i = start; i >= end; --i) { if (layer_need_backward_[i]) { - LAYER_TIMING_START(); + + LAYER_TIMING_START(backward, i); PERFORMANCE_MEASUREMENT_BEGIN(); layers_[i]->Backward( @@ -1335,7 +1339,6 @@ void Net::BackwardFromTo(int start, int end) { PERFORMANCE_MEASUREMENT_END((std::string("BW_")+layer_names_[i]).c_str()); LAYER_TIMING_STOP(backward, i); - if (debug_info_) { BackwardDebugInfo(i); } } } @@ -1917,17 +1920,43 @@ void Net::InitTimers() { this->backward_time_per_layer.resize(layer_count, 0.0); this->update_time_per_layer.resize(layer_count, 0.0); this->cleardiffs_time_per_iter = 0.0; -#ifdef USE_MLSL - this->startcomm_time_per_layer.resize(layer_count, 0.0); - this->waitcomm_time_per_layer.resize(layer_count, 0.0); -#endif + this->forward_time_per_layer_total.resize(layer_count, 0.0); this->backward_time_per_layer_total.resize(layer_count, 0.0); this->update_time_per_layer_total.resize(layer_count, 0.0); this->cleardiffs_time_per_iter_total = 0.0; + + this->forward_start_time_per_layer.resize(layer_count, 0.0); + this->forward_stop_time_per_layer.resize(layer_count, 0.0); + this->backward_start_time_per_layer.resize(layer_count, 0.0); + this->backward_stop_time_per_layer.resize(layer_count, 0.0); + this->update_start_time_per_layer.resize(layer_count, 0.0); + this->update_stop_time_per_layer.resize(layer_count, 0.0); + #ifdef USE_MLSL + this->startcomm_time_per_layer.resize(layer_count, 0.0); + this->waitcomm_time_per_layer.resize(layer_count, 0.0); + this->startcomm_time_per_layer_total.resize(layer_count, 0.0); this->waitcomm_time_per_layer_total.resize(layer_count, 0.0); + + this->startcomm_start_time_per_layer.resize(layer_count, 0.0); + this->startcomm_stop_time_per_layer.resize(layer_count, 0.0); + 
+#ifdef FW_OVERLAP_OPT + this->first_update_start_time_per_layer.resize(layer_count, 0.0); + this->first_update_stop_time_per_layer.resize(layer_count, 0.0); + this->first_waitcomm_start_time_per_layer.resize(layer_count, 0.0); + this->first_waitcomm_stop_time_per_layer.resize(layer_count, 0.0); +#endif + + this->waitcomm_start_time_per_layer.resize(layer_count, 0.0); + this->waitcomm_stop_time_per_layer.resize(layer_count, 0.0); +#endif + + timer.InitTime(); +#ifdef FW_OVERLAP_OPT + wait_timer.InitTime(timer); #endif } @@ -2078,6 +2107,141 @@ void Net::PrintTimers(bool printTotal) { LOG(WARNING) << std::endl; } +template +void Net::SaveTimeline() { + static bool initialized = false; + std::ofstream time_file; + string filename = name() + "_timeline" +#ifdef USE_MLSL + + "_" + std::to_string(mn::get_node_id()) +#endif + + ".txt"; + if (initialized) + time_file.open(filename, std::ios_base::app); + else { + initialized = true; + time_file.open(filename); + } + + time_file << "start,end,type,OP" << std::endl; + + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (forward_start_time_per_layer[layer_idx] == 0 + || forward_stop_time_per_layer[layer_idx] == 0) + continue; + time_file << forward_start_time_per_layer[layer_idx] / 1000 + << "," << forward_stop_time_per_layer[layer_idx] / 1000 + << ",Comp," << layers()[layer_idx]->type() + << std::endl; + } + + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (backward_start_time_per_layer[layer_idx] == 0 + || backward_stop_time_per_layer[layer_idx] == 0) + continue; + time_file << backward_start_time_per_layer[layer_idx] / 1000 + << "," << backward_stop_time_per_layer[layer_idx] / 1000 + << ",Comp," << layers()[layer_idx]->type() << "Grad" + << std::endl; + } + +#if defined(USE_MLSL) && defined(FW_OVERLAP_OPT) + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (first_update_start_time_per_layer[layer_idx] == 0 + || 
first_update_stop_time_per_layer[layer_idx] == 0) + continue; + + time_file << first_update_start_time_per_layer[layer_idx] / 1000 + << "," << first_update_stop_time_per_layer[layer_idx] / 1000 + << ",Comp," << layers()[layer_idx]->type() << "FirstUpdate" + << std::endl; + } +#endif + + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (update_start_time_per_layer[layer_idx] == 0 + || update_stop_time_per_layer[layer_idx] == 0) + continue; + + time_file << update_start_time_per_layer[layer_idx] / 1000 + << "," << update_stop_time_per_layer[layer_idx] / 1000 + << ",Comp," << layers()[layer_idx]->type() << "Update" + << std::endl; + } + +#ifdef USE_MLSL + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (startcomm_start_time_per_layer[layer_idx] == 0 + || startcomm_stop_time_per_layer[layer_idx] == 0) + continue; + + time_file << startcomm_start_time_per_layer[layer_idx] / 1000 + << "," << startcomm_stop_time_per_layer[layer_idx] / 1000 + << ",Comm," << layers()[layer_idx]->type() << "Start" + << std::endl; + } + +#ifdef FW_OVERLAP_OPT + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (first_waitcomm_start_time_per_layer[layer_idx] == 0 + || first_waitcomm_stop_time_per_layer[layer_idx] == 0) + continue; + + time_file << first_waitcomm_start_time_per_layer[layer_idx] / 1000 + << "," << first_waitcomm_stop_time_per_layer[layer_idx] / 1000 + << ",Comm," << layers()[layer_idx]->type() << "FirstWait" + << std::endl; + } +#endif + + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + if (waitcomm_start_time_per_layer[layer_idx] == 0 + || waitcomm_stop_time_per_layer[layer_idx] == 0) + continue; + + time_file << waitcomm_start_time_per_layer[layer_idx] / 1000 + << "," << waitcomm_stop_time_per_layer[layer_idx] / 1000 + << ",Comm," << layers()[layer_idx]->type() << "Wait" + << std::endl; + } +#endif + + time_file.close(); +} + +template +void Net::PrintPayloadSize() { +#ifdef USE_MLSL 
+ if (mn::get_node_id() != 0) + return; +#endif + + int total_payload_size = 0; + const vector *> &net_params (learnable_params()); + + LOG(WARNING) << std::endl; + LOG(WARNING) << "####################################################"; + + + for (int layer_idx = 0; layer_idx < layers().size(); ++layer_idx) { + std::vector param_ids = get_layer_learnable_param_ids(layer_idx); + for (int j = 0; j < param_ids.size(); j++) { + int layer_payload_size = net_params[param_ids[j]]->count(); + + LOG(WARNING) << "LAYER-" << layer_idx << " " + << layers()[layer_idx]->type() + << ": payload_size: " << layer_payload_size + << " units"; + + total_payload_size += layer_payload_size; + } + } + + LOG(WARNING) << "TOTAL PAYLOAD SIZE: " << total_payload_size << " units"; + LOG(WARNING) << "####################################################"; + LOG(WARNING) << std::endl; +} + #endif /* CAFFE_PER_LAYER_TIMINGS */ diff --git a/src/caffe/solver.cpp b/src/caffe/solver.cpp index 579bde991..aad9e3596 100644 --- a/src/caffe/solver.cpp +++ b/src/caffe/solver.cpp @@ -122,6 +122,7 @@ void Solver::Init(const SolverParameter& param) { } iter_ = 0; current_step_ = 0; + } template @@ -352,6 +353,7 @@ void Solver::Step(int iters) { iter_time += iter_timer.MilliSeconds(); #ifdef CAFFE_PER_LAYER_TIMINGS + net_->SaveTimeline(); net_->PrintTimers(false); net_->ResetTimers(); @@ -383,6 +385,7 @@ void Solver::Step(int iters) { #ifdef CAFFE_PER_LAYER_TIMINGS net_->ResetTimers(); net_->PrintTimers(true); + net_->PrintPayloadSize(); #endif } diff --git a/src/caffe/solvers/sgd_solver.cpp b/src/caffe/solvers/sgd_solver.cpp index 37b52ea99..d3f1d49e6 100644 --- a/src/caffe/solvers/sgd_solver.cpp +++ b/src/caffe/solvers/sgd_solver.cpp @@ -48,21 +48,22 @@ namespace caffe { #ifdef CAFFE_PER_LAYER_TIMINGS -#define LAYER_UPDATE_TIMING_START() do { \ - if (this->net_->phase() == TRAIN) { \ - this->net_->timer.Start(); \ +#define LAYER_UPDATE_TIMING_START(index) do { \ + if (this->net()->phase() == TRAIN) { \ + 
this->net()->update_start_time_per_layer[index] = this->net()->timer.Duration(); \ } \ }while(0) #define LAYER_UPDATE_TIMING_STOP(index) do { \ - if (this->net_->phase() == TRAIN) { \ - this->net_->update_time_per_layer[index] += this->net_->timer.MicroSeconds(); \ + if (this->net()->phase() == TRAIN) { \ + this->net()->update_stop_time_per_layer[index] = this->net()->timer.Duration(); \ + this->net()->update_time_per_layer[index] += (this->net()->update_stop_time_per_layer[index] - this->net()->update_start_time_per_layer[index]); \ } \ }while(0) #else -#define LAYER_UPDATE_TIMING_START() +#define LAYER_UPDATE_TIMING_START(index) #define LAYER_UPDATE_TIMING_STOP(index) #endif @@ -225,7 +226,7 @@ void SGDSolver::ApplyUpdate() { #endif for (int i=0; inet_->layers().size(); i++) { const std::vector param_ids = this->net_->get_layer_learnable_param_ids(i); - LAYER_UPDATE_TIMING_START(); + LAYER_UPDATE_TIMING_START(i); for (int param_id = 0; param_id < param_ids.size(); ++param_id) { ApplyUpdate(param_ids[param_id]); } diff --git a/src/caffe/util/benchmark.cpp b/src/caffe/util/benchmark.cpp index a9058ba32..db67f7ded 100644 --- a/src/caffe/util/benchmark.cpp +++ b/src/caffe/util/benchmark.cpp @@ -155,6 +155,20 @@ void Timer::Init() { } } +void Timer::InitTime() { + init_cpu_ = boost::posix_time::microsec_clock::local_time(); +} + +void Timer::InitTime(Timer &timer_) { + init_cpu_ = timer_.init_cpu_; +} + +float Timer::Duration() { + boost::posix_time::ptime curr_cpu_ = boost::posix_time::microsec_clock::local_time(); + float elapsed = (curr_cpu_ - init_cpu_).total_microseconds(); + return elapsed; +} + CPUTimer::CPUTimer() { this->initted_ = true; this->running_ = false; From 5d7497ff29812fdf31878dfbaa000948b7b06e77 Mon Sep 17 00:00:00 2001 From: "Pan, Daoxin" Date: Tue, 19 Dec 2017 14:43:55 +0800 Subject: [PATCH 15/53] Add codes to enable BN+Relu's fusion. 
Change-Id: I9b30edbfbcb65056b7f57355d75d180e3033d82e --- include/caffe/net.hpp | 10 +- src/caffe/layers/mkldnn_batch_norm_layer.cpp | 13 ++- src/caffe/net.cpp | 109 +++++++++++++++++-- src/caffe/proto/caffe.proto | 1 + 4 files changed, 123 insertions(+), 10 deletions(-) mode change 100644 => 100755 src/caffe/layers/mkldnn_batch_norm_layer.cpp mode change 100644 => 100755 src/caffe/net.cpp diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index 3359ac813..52d40ce15 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -312,7 +312,15 @@ class Net { */ static void CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled); - + + /** + * @brief This is rule that analyze layer if it is of type MKLDNNReLU and if that is the case + * and previous layer which serves as input layer to MKLDNNReLU Layer is MKLDNNBN + * then MKLDNNReLU layer can be dropped + */ + static void CompilationRuleFuseBnRelu(const NetParameter& param, + NetParameter* param_compiled); + /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. 
diff --git a/src/caffe/layers/mkldnn_batch_norm_layer.cpp b/src/caffe/layers/mkldnn_batch_norm_layer.cpp old mode 100644 new mode 100755 index 2ef51947b..c8da5f853 --- a/src/caffe/layers/mkldnn_batch_norm_layer.cpp +++ b/src/caffe/layers/mkldnn_batch_norm_layer.cpp @@ -234,9 +234,20 @@ void MKLDNNBatchNormLayer::InitBatchNorm(const vector*>& bott EngineParser ep(subengines); unsigned subEngineIndex = 0; BatchNormFwd_pd = NULL; + bool relu = this->layer_param_.batch_norm_param().relu(); + mkldnn::primitive_attr attr; + mkldnn::post_ops ops; + if (relu) { + ops.append_eltwise(1.f, eltwise_relu, 0.f, 0.f); + attr.set_post_ops(ops); + } for(; subEngineIndex < ep.getNumberOfSubEngines(); subEngineIndex++) { try { - BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, + if (relu) + BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, attr, + ep.getMKLDNNSubEngine(subEngineIndex))); + else + BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, ep.getMKLDNNSubEngine(subEngineIndex))); } catch(...) 
{ diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp old mode 100644 new mode 100755 index 74040f1c1..36ff24e73 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -573,19 +573,24 @@ void Net::CompileNet(const NetParameter& param, param_temp2.clear_layer(); // Remove layers CompilationRuleTwo(param_temp, ¶m_temp2); + NetParameter param_temp3; // temporary compiled param + param_temp3.CopyFrom(param_temp2); + param_temp3.clear_layer(); // Remove layers + CompilationRuleFuseBnRelu(param_temp2, ¶m_temp3); + #ifdef DISABLE_CONV_SUM_FUSION - param_compiled->CopyFrom(param_temp2); + param_compiled->CopyFrom(param_temp3); param_compiled->clear_layer(); // Remove layers - CompilationRuleThree(param_temp2, param_compiled); + CompilationRuleThree(param_temp3, param_compiled); #else - NetParameter param_temp3; - param_temp3.CopyFrom(param_temp2); - param_temp3.clear_layer(); - CompilationRuleThree(param_temp2, ¶m_temp3); + NetParameter param_temp4; + param_temp4.CopyFrom(param_temp3); + param_temp4.clear_layer(); + CompilationRuleThree(param_temp3, ¶m_temp4); - param_compiled->CopyFrom(param_temp3); + param_compiled->CopyFrom(param_temp4); param_compiled->clear_layer(); - CompilationRuleFour(param_temp3, param_compiled); + CompilationRuleFour(param_temp4, param_compiled); #endif } @@ -952,6 +957,94 @@ void Net::CompilationRuleFour(const NetParameter& param, return; } +template +void Net::CompilationRuleFuseBnRelu(const NetParameter& param, + NetParameter* param_compiled) { + + std::set layers_to_drop; + for (int i = 0; i < param.layer_size(); ++i) { + LayerParameter* layer_param = + (const_cast(param)).mutable_layer(i); + bool layer_included = true; + + // Optimization rule BnRelu: + // - If we are having engine MKLDNN and Relu layer within a model + // and input bottom comes from BatchNorm of engine MKLDNN + // then we can remove Relu layer + // and rename BatchNorm top blob after deleted Relu's top + // If current layer is BatchNorm of MKLDNN engine.. 
+ if (((layer_param->type().compare("BatchNorm") == 0) && + ((layer_param->batch_norm_param().engine() == BatchNormParameter_Engine_MKLDNN) || + ((layer_param->batch_norm_param().engine() == BatchNormParameter_Engine_DEFAULT) && + (layer_param->has_engine() == false) && + (param.engine().compare("MKLDNN") == 0)) || + (param.engine() == "" && layer_param->engine().compare("MKLDNN") == 0)))) { + std::vector consumer_layer_params; + GetBlobConsumers(consumer_layer_params, + layer_param->top(0), + param, + i+1 < param.layer_size() ? i+1 : i); + const LayerParameter& consumer_layer_param = + consumer_layer_params.size() > 0 ? + *(consumer_layer_params[0]) : *layer_param; + // Consumer layer of blob produced by BN + // has to be Relu layer with one Input Blob + + if ((consumer_layer_param.type().compare("ReLU") == 0) && + ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_MKLDNN) || + ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_DEFAULT) && + (consumer_layer_param.engine().compare(0, 6, "MKLDNN") == 0 && + consumer_layer_param.engine().find(":DLA", 6) == string::npos)) || + ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_DEFAULT) && + (consumer_layer_param.engine() == "") && + (param.engine().compare(0, 6, "MKLDNN") == 0 && + param.engine().find(":DLA", 6) == string::npos))) && + !consumer_layer_param.relu_param().negative_slope()) { + // negative_slope should be zero + string& batchnorm_top_blob_name = + const_cast(layer_param->top(0)); + + if(param.state().phase() == TEST) { + const string& relu_top_blob_name = consumer_layer_param.top(0); + // Mark Consumer layer (its name) as the one marked for dropping + layers_to_drop.insert(consumer_layer_param.name()); + + // Replace BatchNorm top name with ReLU top name + batchnorm_top_blob_name.resize(relu_top_blob_name.size()); + batchnorm_top_blob_name.replace(0, + relu_top_blob_name.size(), + relu_top_blob_name); + } + // set relu flag in BN + 
layer_param->mutable_batch_norm_param()->set_relu(true); + + if(param.state().phase() == TRAIN) { + if(i+1 < param.layer_size()) { + LayerParameter* relu_layer_param = + (const_cast<NetParameter&>(param)).mutable_layer(i+1); + relu_layer_param->mutable_relu_param()->set_fuse(true); + // LOG(INFO) << "Bn + Relu fused." << std::endl; + } + } + } + } + + if(param.state().phase() == TEST) { + if (layers_to_drop.find(layer_param->name()) != layers_to_drop.end()) { + LOG_IF(INFO, Caffe::root_solver()) << "Dropped layer: " + << layer_param->name() << std::endl; + layer_included = false; + // Remove dropped layer from the list of layers to be dropped + layers_to_drop.erase(layers_to_drop.find(layer_param->name())); + } + } + + if (layer_included) { + param_compiled->add_layer()->CopyFrom(*layer_param); + } + } +} + template <typename Dtype> void Net<Dtype>::GetBlobConsumers( std::vector<const LayerParameter*>& consumer_blobs, diff --git a/src/caffe/proto/caffe.proto b/src/caffe/proto/caffe.proto index 439415c26..ea69365d7 100755 --- a/src/caffe/proto/caffe.proto +++ b/src/caffe/proto/caffe.proto @@ -933,6 +933,7 @@ message BatchNormParameter { optional FillerParameter bias_filler = 8; // The filler for the bias // Batch size used for statistics, 0 would use the batch size of bottom blob optional uint32 stats_batch_size = 9 [default = 0]; + optional bool relu = 10 [default = false]; } message SplitParameter { From 76d9e640dc9f0d8a4d43ab38f9b5320d52e12d25 Mon Sep 17 00:00:00 2001 From: Daisy Deng Date: Wed, 20 Dec 2017 19:45:30 +0800 Subject: [PATCH 16/53] add default resnet50 and remove the train_dummydata.prototxt of ssd --- .../default_resnet50_16nodes/solver.prototxt | 19 + .../train_val.prototxt | 3325 +++++++++++++++++ .../SSD_300x300/train_dummydata.prototxt | 1633 -------- 3 files changed, 3344 insertions(+), 1633 deletions(-) create mode 100644 models/intel_optimized_models/multinode/default_resnet50_16nodes/solver.prototxt create mode 100644 models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt 
delete mode 100644 models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt diff --git a/models/intel_optimized_models/multinode/default_resnet50_16nodes/solver.prototxt b/models/intel_optimized_models/multinode/default_resnet50_16nodes/solver.prototxt new file mode 100644 index 000000000..27054d7d2 --- /dev/null +++ b/models/intel_optimized_models/multinode/default_resnet50_16nodes/solver.prototxt @@ -0,0 +1,19 @@ +net: "models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt" +test_iter: 1000 +test_interval: 625 +test_initialization: false +display: 40 +base_lr: 0.8 +lr_policy: "multistep" +stepvalue:18750 +stepvalue:37500 +stepvalue:50000 +gamma: 0.1 +max_iter: 62556 # 56300 +warmup_iter: 3125 # 1281167 / 2048 * 5 epochs +warmup_start_lr: 0.1 +momentum: 0.9 +weight_decay: 0.0001 +snapshot: 6250 +snapshot_prefix: "default_resnet_50_16_nodes" +solver_mode: CPU diff --git a/models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt b/models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt new file mode 100644 index 000000000..de4efad2b --- /dev/null +++ b/models/intel_optimized_models/multinode/default_resnet50_16nodes/train_val.prototxt @@ -0,0 +1,3325 @@ +name: "ResNet-50" +bn_stats_batch_size: 32 +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TRAIN + } + transform_param { + mirror: true + crop_size: 224 + scale: 0.0078125 + mean_value: 104 + mean_value: 117 + mean_value: 123 + random_aspect_ratio_param { + min_area_ratio: 0.08 + max_area_ratio: 1 + aspect_ratio_change: 0.75 + resize_param { + interp_mode: CUBIC + } + } + } + data_param { + source: "examples/imagenet/ilsvrc12_train_lmdb" + batch_size: 128 + backend: LMDB + prefetch: 2 + shuffle: true + } +} +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TEST + } + transform_param { + mirror: false + crop_size: 224 + scale: 
0.0078125 + mean_value: 104 + mean_value: 117 + mean_value: 123 + random_resize_param { + min_size: 256 + max_size: 256 + resize_param { + interp_mode: CUBIC + } + } + } + data_param { + source: "examples/imagenet/ilsvrc12_val_lmdb" + batch_size: 50 + backend: LMDB + } +} + +layer { + bottom: "data" + top: "conv1" + name: "conv1" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 7 + pad: 3 + stride: 2 + weight_filler { + type: "msra" + variance_norm: FAN_OUT + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "bn_conv1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "scale_conv1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "conv1_relu" + type: "ReLU" + relu_param { + } +} + +layer { + bottom: "conv1" + top: "pool1" + name: "pool1" + type: "Pooling" + pooling_param { + kernel_size: 3 + stride: 2 + pool: MAX + } +} + +layer { + bottom: "pool1" + top: "res2a_branch1" + name: "res2a_branch1" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "bn2a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "scale2a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "pool1" + top: "res2a_branch2a" + 
name: "res2a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "bn2a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "scale2a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "res2a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2b" + name: "res2a_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "bn2a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "scale2a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "res2a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2c" + name: "res2a_branch2c" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } 
+ } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "bn2a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "scale2a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch1" + bottom: "res2a_branch2c" + top: "res2a" + name: "res2a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2a" + top: "res2a" + name: "res2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a" + top: "res2b_branch2a" + name: "res2b_branch2a" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "bn2b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "scale2b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "res2b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2b" + name: "res2b_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "bn2b_branch2b" + type: "BatchNorm" + param { 
lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "scale2b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "res2b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2c" + name: "res2b_branch2c" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "bn2b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "scale2b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a" + bottom: "res2b_branch2c" + top: "res2b" + name: "res2b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2b" + top: "res2b" + name: "res2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b" + top: "res2c_branch2a" + name: "res2c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "bn2c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } 
+ } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "scale2c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "res2c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2b" + name: "res2c_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "bn2c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "scale2c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "res2c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2c" + name: "res2c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "bn2c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "scale2c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: 
"res2b" + bottom: "res2c_branch2c" + top: "res2c" + name: "res2c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2c" + top: "res2c" + name: "res2c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c" + top: "res3a_branch1" + name: "res3a_branch1" + type: "Convolution" + convolution_param { + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "bn3a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "scale3a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c" + top: "res3a_branch2a" + name: "res3a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "bn3a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "scale3a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "res3a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2b" + name: "res3a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + 
pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "bn3a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "scale3a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "res3a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2c" + name: "res3a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "bn3a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "scale3a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch1" + bottom: "res3a_branch2c" + top: "res3a" + name: "res3a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3a" + top: "res3a" + name: "res3a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a" + top: "res3b_branch2a" + name: "res3b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 
+ } + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "bn3b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "scale3b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "res3b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2b" + name: "res3b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "bn3b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "scale3b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "res3b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2c" + name: "res3b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + name: "bn3b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + 
moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + name: "scale3b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a" + bottom: "res3b_branch2c" + top: "res3b" + name: "res3b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3b" + top: "res3b" + name: "res3b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b" + top: "res3c_branch2a" + name: "res3c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "bn3c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "scale3c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "res3c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2b" + name: "res3c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "bn3c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: 
"scale3c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "res3c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2c" + name: "res3c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "bn3c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "scale3c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b" + bottom: "res3c_branch2c" + top: "res3c" + name: "res3c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3c" + top: "res3c" + name: "res3c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c" + top: "res3d_branch2a" + name: "res3d_branch2a" + type: "Convolution" + convolution_param { + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "bn3d_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "scale3d_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + 
+layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "res3d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2b" + name: "res3d_branch2b" + type: "Convolution" + convolution_param { + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "bn3d_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "scale3d_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "res3d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2c" + name: "res3d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "bn3d_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "scale3d_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c" + bottom: "res3d_branch2c" + top: "res3d" + name: "res3d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3d" + top: "res3d" + name: "res3d_relu" + type: "ReLU" + relu_param { + 
+ } +} + +layer { + bottom: "res3d" + top: "res4a_branch1" + name: "res4a_branch1" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "bn4a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "scale4a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d" + top: "res4a_branch2a" + name: "res4a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "bn4a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "scale4a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "res4a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2b" + name: "res4a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: 
"bn4a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "scale4a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "res4a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2c" + name: "res4a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "bn4a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "scale4a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch1" + bottom: "res4a_branch2c" + top: "res4a" + name: "res4a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4a" + top: "res4a" + name: "res4a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a" + top: "res4b_branch2a" + name: "res4b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "bn4b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + 
batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "scale4b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "res4b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2b" + name: "res4b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "bn4b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "scale4b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "res4b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2c" + name: "res4b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "bn4b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "scale4b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { 
decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a" + bottom: "res4b_branch2c" + top: "res4b" + name: "res4b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4b" + top: "res4b" + name: "res4b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b" + top: "res4c_branch2a" + name: "res4c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "bn4c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "scale4c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "res4c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2b" + name: "res4c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "bn4c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "scale4c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: 
"res4c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2c" + name: "res4c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2c" + top: "res4c_branch2c" + name: "bn4c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2c" + top: "res4c_branch2c" + name: "scale4c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b" + bottom: "res4c_branch2c" + top: "res4c" + name: "res4c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4c" + top: "res4c" + name: "res4c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c" + top: "res4d_branch2a" + name: "res4d_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "bn4d_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "scale4d_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "res4d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2b" + 
name: "res4d_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "bn4d_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "scale4d_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "res4d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2c" + name: "res4d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "bn4d_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "scale4d_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c" + bottom: "res4d_branch2c" + top: "res4d" + name: "res4d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4d" + top: "res4d" + name: "res4d_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d" + top: "res4e_branch2a" + name: "res4e_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + 
bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "bn4e_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "scale4e_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "res4e_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2b" + name: "res4e_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "bn4e_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "scale4e_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "res4e_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2c" + name: "res4e_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "bn4e_branch2c" + type: "BatchNorm" + param 
{ lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "scale4e_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d" + bottom: "res4e_branch2c" + top: "res4e" + name: "res4e" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4e" + top: "res4e" + name: "res4e_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e" + top: "res4f_branch2a" + name: "res4f_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "bn4f_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "scale4f_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "res4f_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2b" + name: "res4f_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "bn4f_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { 
value: 1 } + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "scale4f_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "res4f_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2c" + name: "res4f_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "bn4f_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "scale4f_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e" + bottom: "res4f_branch2c" + top: "res4f" + name: "res4f" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4f" + top: "res4f" + name: "res4f_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f" + top: "res5a_branch1" + name: "res5a_branch1" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "bn5a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "scale5a_branch1" + type: "Scale" + param { 
decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f" + top: "res5a_branch2a" + name: "res5a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "bn5a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "scale5a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "res5a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2b" + name: "res5a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "bn5a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "scale5a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "res5a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2c" + name: "res5a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 
+ kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "bn5a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "scale5a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch1" + bottom: "res5a_branch2c" + top: "res5a" + name: "res5a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res5a" + top: "res5a" + name: "res5a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a" + top: "res5b_branch2a" + name: "res5b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "bn5b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "scale5b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "res5b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2b" + name: "res5b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: 
"constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "bn5b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "scale5b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "res5b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2c" + name: "res5b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "bn5b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "scale5b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a" + bottom: "res5b_branch2c" + top: "res5b" + name: "res5b" + type: "Eltwise" + eltwise_param { + } +} + +layer { + bottom: "res5b" + top: "res5b" + name: "res5b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b" + top: "res5c_branch2a" + name: "res5c_branch2a" + type: "Convolution" + convolution_param { + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "bn5c_branch2a" + type: 
"BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "scale5c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "res5c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2b" + name: "res5c_branch2b" + type: "Convolution" + convolution_param { + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "bn5c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "scale5c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "res5c_branch2b_relu" + type: "ReLU" + relu_param { + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2c" + name: "res5c_branch2c" + type: "Convolution" + convolution_param { + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + name: "bn5c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + 
name: "scale5c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b" + bottom: "res5c_branch2c" + top: "res5c" + name: "res5c" + type: "Eltwise" + eltwise_param { + } +} + +layer { + bottom: "res5c" + top: "res5c" + name: "res5c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c" + top: "pool5" + name: "pool5" + type: "Pooling" + pooling_param { + kernel_size: 7 + stride: 1 + pool: AVE + } +} + +layer { + bottom: "pool5" + top: "fc1000" + name: "fc1000" + type: "InnerProduct" + inner_product_param { + num_output: 1000 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "fc1000" + bottom: "label" + top: "loss" + name: "prob" + type: "SoftmaxWithLoss" + include { + phase: TRAIN + } +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-1" +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-5" + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt deleted file mode 100644 index 41cf79ab3..000000000 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train_dummydata.prototxt +++ /dev/null @@ -1,1633 +0,0 @@ -name: "VGG_VOC0712_SSD_300x300_train" -layer { - name: "data" - type: "DummyData" - top: "data" - dummy_data_param { - data_filler { - type: "constant" - value: 0.01 - } - shape { - dim: 32 - dim: 3 - dim: 300 - dim: 300 - } - } -} -layer { - name: "data" - type: "DummyData" - top: "label" - dummy_data_param { - data_filler { - type: "constant" - value: 1 - } - shape { - dim: 1 - dim: 1 - dim: 1 - dim: 8 - } - } -} -layer { - name: "conv1_1" - type: "Convolution" - bottom: "data" - top: 
"conv1_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 64 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu1_1" - type: "ReLU" - bottom: "conv1_1" - top: "conv1_1" -} -layer { - name: "conv1_2" - type: "Convolution" - bottom: "conv1_1" - top: "conv1_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 64 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu1_2" - type: "ReLU" - bottom: "conv1_2" - top: "conv1_2" -} -layer { - name: "pool1" - type: "Pooling" - bottom: "conv1_2" - top: "pool1" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - name: "conv2_1" - type: "Convolution" - bottom: "pool1" - top: "conv2_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu2_1" - type: "ReLU" - bottom: "conv2_1" - top: "conv2_1" -} -layer { - name: "conv2_2" - type: "Convolution" - bottom: "conv2_1" - top: "conv2_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu2_2" - type: "ReLU" - bottom: "conv2_2" - top: "conv2_2" -} -layer { - name: "pool2" - type: "Pooling" - bottom: "conv2_2" - top: "pool2" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - name: "conv3_1" - type: "Convolution" - bottom: "pool2" - top: "conv3_1" - param { - lr_mult: 1 - decay_mult: 1 - } 
- param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu3_1" - type: "ReLU" - bottom: "conv3_1" - top: "conv3_1" -} -layer { - name: "conv3_2" - type: "Convolution" - bottom: "conv3_1" - top: "conv3_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu3_2" - type: "ReLU" - bottom: "conv3_2" - top: "conv3_2" -} -layer { - name: "conv3_3" - type: "Convolution" - bottom: "conv3_2" - top: "conv3_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu3_3" - type: "ReLU" - bottom: "conv3_3" - top: "conv3_3" -} -layer { - name: "pool3" - type: "Pooling" - bottom: "conv3_3" - top: "pool3" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - name: "conv4_1" - type: "Convolution" - bottom: "pool3" - top: "conv4_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu4_1" - type: "ReLU" - bottom: "conv4_1" - top: "conv4_1" -} -layer { - name: "conv4_2" - type: "Convolution" - bottom: "conv4_1" - top: "conv4_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 
- } - } -} -layer { - name: "relu4_2" - type: "ReLU" - bottom: "conv4_2" - top: "conv4_2" -} -layer { - name: "conv4_3" - type: "Convolution" - bottom: "conv4_2" - top: "conv4_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu4_3" - type: "ReLU" - bottom: "conv4_3" - top: "conv4_3" -} -layer { - name: "pool4" - type: "Pooling" - bottom: "conv4_3" - top: "pool4" - pooling_param { - pool: MAX - kernel_size: 2 - stride: 2 - } -} -layer { - name: "conv5_1" - type: "Convolution" - bottom: "pool4" - top: "conv5_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - name: "relu5_1" - type: "ReLU" - bottom: "conv5_1" - top: "conv5_1" -} -layer { - name: "conv5_2" - type: "Convolution" - bottom: "conv5_1" - top: "conv5_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - name: "relu5_2" - type: "ReLU" - bottom: "conv5_2" - top: "conv5_2" -} -layer { - name: "conv5_3" - type: "Convolution" - bottom: "conv5_2" - top: "conv5_3" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 1 - } -} -layer { - name: "relu5_3" - type: "ReLU" - bottom: "conv5_3" - top: "conv5_3" -} -layer { - name: "pool5" - type: "Pooling" - bottom: 
"conv5_3" - top: "pool5" - pooling_param { - pool: MAX - kernel_size: 3 - stride: 1 - pad: 1 - } -} -layer { - name: "fc6" - type: "Convolution" - bottom: "pool5" - top: "fc6" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 1024 - pad: 6 - kernel_size: 3 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - dilation: 6 - } -} -layer { - name: "relu6" - type: "ReLU" - bottom: "fc6" - top: "fc6" -} -layer { - name: "fc7" - type: "Convolution" - bottom: "fc6" - top: "fc7" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 1024 - kernel_size: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "relu7" - type: "ReLU" - bottom: "fc7" - top: "fc7" -} -layer { - name: "conv6_1" - type: "Convolution" - bottom: "fc7" - top: "conv6_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv6_1_relu" - type: "ReLU" - bottom: "conv6_1" - top: "conv6_1" -} -layer { - name: "conv6_2" - type: "Convolution" - bottom: "conv6_1" - top: "conv6_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 512 - pad: 1 - kernel_size: 3 - stride: 2 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv6_2_relu" - type: "ReLU" - bottom: "conv6_2" - top: "conv6_2" -} -layer { - name: "conv7_1" - type: "Convolution" - bottom: "conv6_2" - top: "conv7_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - 
stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_1_relu" - type: "ReLU" - bottom: "conv7_1" - top: "conv7_1" -} -layer { - name: "conv7_2" - type: "Convolution" - bottom: "conv7_1" - top: "conv7_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 1 - kernel_size: 3 - stride: 2 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_2_relu" - type: "ReLU" - bottom: "conv7_2" - top: "conv7_2" -} -layer { - name: "conv8_1" - type: "Convolution" - bottom: "conv7_2" - top: "conv8_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_1_relu" - type: "ReLU" - bottom: "conv8_1" - top: "conv8_1" -} -layer { - name: "conv8_2" - type: "Convolution" - bottom: "conv8_1" - top: "conv8_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_2_relu" - type: "ReLU" - bottom: "conv8_2" - top: "conv8_2" -} -layer { - name: "conv9_1" - type: "Convolution" - bottom: "conv8_2" - top: "conv9_1" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 128 - pad: 0 - kernel_size: 1 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_1_relu" - type: "ReLU" - bottom: "conv9_1" - top: "conv9_1" -} -layer { - name: "conv9_2" - type: "Convolution" - bottom: "conv9_1" - 
top: "conv9_2" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 256 - pad: 0 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_2_relu" - type: "ReLU" - bottom: "conv9_2" - top: "conv9_2" -} -layer { - name: "conv4_3_norm" - type: "Normalize" - bottom: "conv4_3" - top: "conv4_3_norm" - norm_param { - across_spatial: false - scale_filler { - type: "constant" - value: 20 - } - channel_shared: false - } -} -layer { - name: "conv4_3_norm_mbox_loc" - type: "Convolution" - bottom: "conv4_3_norm" - top: "conv4_3_norm_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv4_3_norm_mbox_loc_perm" - type: "Permute" - bottom: "conv4_3_norm_mbox_loc" - top: "conv4_3_norm_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv4_3_norm_mbox_loc_flat" - type: "Flatten" - bottom: "conv4_3_norm_mbox_loc_perm" - top: "conv4_3_norm_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv4_3_norm_mbox_conf" - type: "Convolution" - bottom: "conv4_3_norm" - top: "conv4_3_norm_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv4_3_norm_mbox_conf_perm" - type: "Permute" - bottom: "conv4_3_norm_mbox_conf" - top: "conv4_3_norm_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv4_3_norm_mbox_conf_flat" - type: "Flatten" - bottom: 
"conv4_3_norm_mbox_conf_perm" - top: "conv4_3_norm_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv4_3_norm_mbox_priorbox" - type: "PriorBox" - bottom: "conv4_3_norm" - bottom: "data" - top: "conv4_3_norm_mbox_priorbox" - prior_box_param { - min_size: 30.0 - max_size: 60.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 8 - offset: 0.5 - } -} -layer { - name: "fc7_mbox_loc" - type: "Convolution" - bottom: "fc7" - top: "fc7_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "fc7_mbox_loc_perm" - type: "Permute" - bottom: "fc7_mbox_loc" - top: "fc7_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "fc7_mbox_loc_flat" - type: "Flatten" - bottom: "fc7_mbox_loc_perm" - top: "fc7_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "fc7_mbox_conf" - type: "Convolution" - bottom: "fc7" - top: "fc7_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "fc7_mbox_conf_perm" - type: "Permute" - bottom: "fc7_mbox_conf" - top: "fc7_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "fc7_mbox_conf_flat" - type: "Flatten" - bottom: "fc7_mbox_conf_perm" - top: "fc7_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "fc7_mbox_priorbox" - type: "PriorBox" - bottom: "fc7" - bottom: "data" - top: "fc7_mbox_priorbox" - prior_box_param { - min_size: 60.0 - max_size: 111.0 - aspect_ratio: 2 - 
aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 16 - offset: 0.5 - } -} -layer { - name: "conv6_2_mbox_loc" - type: "Convolution" - bottom: "conv6_2" - top: "conv6_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv6_2_mbox_loc_perm" - type: "Permute" - bottom: "conv6_2_mbox_loc" - top: "conv6_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv6_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv6_2_mbox_loc_perm" - top: "conv6_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv6_2_mbox_conf" - type: "Convolution" - bottom: "conv6_2" - top: "conv6_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv6_2_mbox_conf_perm" - type: "Permute" - bottom: "conv6_2_mbox_conf" - top: "conv6_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv6_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv6_2_mbox_conf_perm" - top: "conv6_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv6_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv6_2" - bottom: "data" - top: "conv6_2_mbox_priorbox" - prior_box_param { - min_size: 111.0 - max_size: 162.0 - aspect_ratio: 2 - aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 32 - offset: 0.5 - } -} -layer { - name: "conv7_2_mbox_loc" - type: "Convolution" - bottom: "conv7_2" - top: 
"conv7_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 24 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_2_mbox_loc_perm" - type: "Permute" - bottom: "conv7_2_mbox_loc" - top: "conv7_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv7_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv7_2_mbox_loc_perm" - top: "conv7_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv7_2_mbox_conf" - type: "Convolution" - bottom: "conv7_2" - top: "conv7_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 126 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv7_2_mbox_conf_perm" - type: "Permute" - bottom: "conv7_2_mbox_conf" - top: "conv7_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv7_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv7_2_mbox_conf_perm" - top: "conv7_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv7_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv7_2" - bottom: "data" - top: "conv7_2_mbox_priorbox" - prior_box_param { - min_size: 162.0 - max_size: 213.0 - aspect_ratio: 2 - aspect_ratio: 3 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 64 - offset: 0.5 - } -} -layer { - name: "conv8_2_mbox_loc" - type: "Convolution" - bottom: "conv8_2" - top: "conv8_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - 
bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_2_mbox_loc_perm" - type: "Permute" - bottom: "conv8_2_mbox_loc" - top: "conv8_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv8_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv8_2_mbox_loc_perm" - top: "conv8_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv8_2_mbox_conf" - type: "Convolution" - bottom: "conv8_2" - top: "conv8_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv8_2_mbox_conf_perm" - type: "Permute" - bottom: "conv8_2_mbox_conf" - top: "conv8_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv8_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv8_2_mbox_conf_perm" - top: "conv8_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv8_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv8_2" - bottom: "data" - top: "conv8_2_mbox_priorbox" - prior_box_param { - min_size: 213.0 - max_size: 264.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 100 - offset: 0.5 - } -} -layer { - name: "conv9_2_mbox_loc" - type: "Convolution" - bottom: "conv9_2" - top: "conv9_2_mbox_loc" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 16 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_2_mbox_loc_perm" - type: "Permute" - bottom: "conv9_2_mbox_loc" - top: "conv9_2_mbox_loc_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} 
-layer { - name: "conv9_2_mbox_loc_flat" - type: "Flatten" - bottom: "conv9_2_mbox_loc_perm" - top: "conv9_2_mbox_loc_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv9_2_mbox_conf" - type: "Convolution" - bottom: "conv9_2" - top: "conv9_2_mbox_conf" - param { - lr_mult: 1 - decay_mult: 1 - } - param { - lr_mult: 2 - decay_mult: 0 - } - convolution_param { - num_output: 84 - pad: 1 - kernel_size: 3 - stride: 1 - weight_filler { - type: "xavier" - } - bias_filler { - type: "constant" - value: 0 - } - } -} -layer { - name: "conv9_2_mbox_conf_perm" - type: "Permute" - bottom: "conv9_2_mbox_conf" - top: "conv9_2_mbox_conf_perm" - permute_param { - order: 0 - order: 2 - order: 3 - order: 1 - } -} -layer { - name: "conv9_2_mbox_conf_flat" - type: "Flatten" - bottom: "conv9_2_mbox_conf_perm" - top: "conv9_2_mbox_conf_flat" - flatten_param { - axis: 1 - } -} -layer { - name: "conv9_2_mbox_priorbox" - type: "PriorBox" - bottom: "conv9_2" - bottom: "data" - top: "conv9_2_mbox_priorbox" - prior_box_param { - min_size: 264.0 - max_size: 315.0 - aspect_ratio: 2 - flip: true - clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 300 - offset: 0.5 - } -} -layer { - name: "mbox_loc" - type: "Concat" - bottom: "conv4_3_norm_mbox_loc_flat" - bottom: "fc7_mbox_loc_flat" - bottom: "conv6_2_mbox_loc_flat" - bottom: "conv7_2_mbox_loc_flat" - bottom: "conv8_2_mbox_loc_flat" - bottom: "conv9_2_mbox_loc_flat" - top: "mbox_loc" - concat_param { - axis: 1 - } - engine: "CAFFE" -} -layer { - name: "mbox_conf" - type: "Concat" - bottom: "conv4_3_norm_mbox_conf_flat" - bottom: "fc7_mbox_conf_flat" - bottom: "conv6_2_mbox_conf_flat" - bottom: "conv7_2_mbox_conf_flat" - bottom: "conv8_2_mbox_conf_flat" - bottom: "conv9_2_mbox_conf_flat" - top: "mbox_conf" - concat_param { - axis: 1 - } - engine: "CAFFE" -} -layer { - name: "mbox_priorbox" - type: "Concat" - bottom: "conv4_3_norm_mbox_priorbox" - bottom: "fc7_mbox_priorbox" - bottom: 
"conv6_2_mbox_priorbox" - bottom: "conv7_2_mbox_priorbox" - bottom: "conv8_2_mbox_priorbox" - bottom: "conv9_2_mbox_priorbox" - top: "mbox_priorbox" - concat_param { - axis: 2 - } - engine: "CAFFE" -} -layer { - name: "mbox_loss" - type: "MultiBoxLoss" - bottom: "mbox_loc" - bottom: "mbox_conf" - bottom: "mbox_priorbox" - bottom: "label" - top: "mbox_loss" - include { - phase: TRAIN - } - propagate_down: true - propagate_down: true - propagate_down: false - propagate_down: false - loss_param { - normalization: VALID - } - multibox_loss_param { - loc_loss_type: SMOOTH_L1 - conf_loss_type: SOFTMAX - loc_weight: 1.0 - num_classes: 21 - share_location: true - match_type: PER_PREDICTION - overlap_threshold: 0.5 - use_prior_for_matching: true - background_label_id: 0 - use_difficult_gt: true - neg_pos_ratio: 3.0 - neg_overlap: 0.5 - code_type: CENTER_SIZE - ignore_cross_boundary_bbox: false - mining_type: MAX_NEGATIVE - } -} - From b27798a0d89a5504c9fa52ba196c8a8dda2a03ea Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Thu, 21 Dec 2017 21:34:29 +0800 Subject: [PATCH 17/53] Fix for the issues found by ut. --- src/caffe/net.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 74040f1c1..49e35f699 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -754,6 +754,7 @@ void Net::CompilationRuleTwo(const NetParameter& param, use_negative_slope = true; } else { layer_param->mutable_convolution_param()->set_relu(true); + layer_param->mutable_convolution_param()->set_negative_slope(0); } if(param.state().phase() == TRAIN && !use_negative_slope) { if(i+1 < param.layer_size()) { From d44aaeff882de34addc3fe357ba3b6e004970980 Mon Sep 17 00:00:00 2001 From: "Pan, Daoxin" Date: Fri, 22 Dec 2017 09:30:02 +0800 Subject: [PATCH 18/53] Revert "Add codes to enable BN+Relu's fusion." This reverts commit 5d7497ff29812fdf31878dfbaa000948b7b06e77. 
Change-Id: Ic5222ecb54389be579857c4a75574f5548cbb8ca --- include/caffe/net.hpp | 10 +- src/caffe/layers/mkldnn_batch_norm_layer.cpp | 13 +-- src/caffe/net.cpp | 109 ++----------------- src/caffe/proto/caffe.proto | 1 - 4 files changed, 10 insertions(+), 123 deletions(-) mode change 100755 => 100644 src/caffe/layers/mkldnn_batch_norm_layer.cpp mode change 100755 => 100644 src/caffe/net.cpp diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index 52d40ce15..3359ac813 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -312,15 +312,7 @@ class Net { */ static void CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled); - - /** - * @brief This is rule that analyze layer if it is of type MKLDNNReLU and if that is the case - * and previous layer which serves as input layer to MKLDNNReLU Layer is MKLDNNBN - * then MKLDNNReLU layer can be dropped - */ - static void CompilationRuleFuseBnRelu(const NetParameter& param, - NetParameter* param_compiled); - + /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. 
diff --git a/src/caffe/layers/mkldnn_batch_norm_layer.cpp b/src/caffe/layers/mkldnn_batch_norm_layer.cpp old mode 100755 new mode 100644 index c8da5f853..2ef51947b --- a/src/caffe/layers/mkldnn_batch_norm_layer.cpp +++ b/src/caffe/layers/mkldnn_batch_norm_layer.cpp @@ -234,20 +234,9 @@ void MKLDNNBatchNormLayer::InitBatchNorm(const vector*>& bott EngineParser ep(subengines); unsigned subEngineIndex = 0; BatchNormFwd_pd = NULL; - bool relu = this->layer_param_.batch_norm_param().relu(); - mkldnn::primitive_attr attr; - mkldnn::post_ops ops; - if (relu) { - ops.append_eltwise(1.f, eltwise_relu, 0.f, 0.f); - attr.set_post_ops(ops); - } for(; subEngineIndex < ep.getNumberOfSubEngines(); subEngineIndex++) { try { - if (relu) - BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, attr, - ep.getMKLDNNSubEngine(subEngineIndex))); - else - BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, + BatchNormFwd_pd.reset(new batch_normalization_forward::primitive_desc(BatchNormFwd_desc, ep.getMKLDNNSubEngine(subEngineIndex))); } catch(...) 
{ diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp old mode 100755 new mode 100644 index 36ff24e73..74040f1c1 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -573,24 +573,19 @@ void Net::CompileNet(const NetParameter& param, param_temp2.clear_layer(); // Remove layers CompilationRuleTwo(param_temp, ¶m_temp2); - NetParameter param_temp3; // temporary compiled param - param_temp3.CopyFrom(param_temp2); - param_temp3.clear_layer(); // Remove layers - CompilationRuleFuseBnRelu(param_temp2, ¶m_temp3); - #ifdef DISABLE_CONV_SUM_FUSION - param_compiled->CopyFrom(param_temp3); + param_compiled->CopyFrom(param_temp2); param_compiled->clear_layer(); // Remove layers - CompilationRuleThree(param_temp3, param_compiled); + CompilationRuleThree(param_temp2, param_compiled); #else - NetParameter param_temp4; - param_temp4.CopyFrom(param_temp3); - param_temp4.clear_layer(); - CompilationRuleThree(param_temp3, ¶m_temp4); + NetParameter param_temp3; + param_temp3.CopyFrom(param_temp2); + param_temp3.clear_layer(); + CompilationRuleThree(param_temp2, ¶m_temp3); - param_compiled->CopyFrom(param_temp4); + param_compiled->CopyFrom(param_temp3); param_compiled->clear_layer(); - CompilationRuleFour(param_temp4, param_compiled); + CompilationRuleFour(param_temp3, param_compiled); #endif } @@ -957,94 +952,6 @@ void Net::CompilationRuleFour(const NetParameter& param, return; } -template -void Net::CompilationRuleFuseBnRelu(const NetParameter& param, - NetParameter* param_compiled) { - - std::set layers_to_drop; - for (int i = 0; i < param.layer_size(); ++i) { - LayerParameter* layer_param = - (const_cast(param)).mutable_layer(i); - bool layer_included = true; - - // Optimization rule BnRelu: - // - If we are having engine MKLDNN and Relu layer within a model - // and input bottom comes from BatchNorm of engine MKLDNN - // then we can remove Relu layer - // and rename BatchNorm top blob after deleted Relu's top - // If current layer is BatchNorm of MKLDNN engine.. 
- if (((layer_param->type().compare("BatchNorm") == 0) && - ((layer_param->batch_norm_param().engine() == BatchNormParameter_Engine_MKLDNN) || - ((layer_param->batch_norm_param().engine() == BatchNormParameter_Engine_DEFAULT) && - (layer_param->has_engine() == false) && - (param.engine().compare("MKLDNN") == 0)) || - (param.engine() == "" && layer_param->engine().compare("MKLDNN") == 0)))) { - std::vector consumer_layer_params; - GetBlobConsumers(consumer_layer_params, - layer_param->top(0), - param, - i+1 < param.layer_size() ? i+1 : i); - const LayerParameter& consumer_layer_param = - consumer_layer_params.size() > 0 ? - *(consumer_layer_params[0]) : *layer_param; - // Consumer layer of blob produced by BN - // has to be Relu layer with one Input Blob - - if ((consumer_layer_param.type().compare("ReLU") == 0) && - ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_MKLDNN) || - ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_DEFAULT) && - (consumer_layer_param.engine().compare(0, 6, "MKLDNN") == 0 && - consumer_layer_param.engine().find(":DLA", 6) == string::npos)) || - ((consumer_layer_param.relu_param().engine() == ReLUParameter_Engine_DEFAULT) && - (consumer_layer_param.engine() == "") && - (param.engine().compare(0, 6, "MKLDNN") == 0 && - param.engine().find(":DLA", 6) == string::npos))) && - !consumer_layer_param.relu_param().negative_slope()) { - // negative_slope should be zero - string& batchnorm_top_blob_name = - const_cast(layer_param->top(0)); - - if(param.state().phase() == TEST) { - const string& relu_top_blob_name = consumer_layer_param.top(0); - // Mark Consumer layer (its name) as the one marked for dropping - layers_to_drop.insert(consumer_layer_param.name()); - - // Replace BatchNorm top name with ReLU top name - batchnorm_top_blob_name.resize(relu_top_blob_name.size()); - batchnorm_top_blob_name.replace(0, - relu_top_blob_name.size(), - relu_top_blob_name); - } - // set relu flag in BN - 
layer_param->mutable_batch_norm_param()->set_relu(true); - - if(param.state().phase() == TRAIN) { - if(i+1 < param.layer_size()) { - LayerParameter* relu_layer_param = - (const_cast(param)).mutable_layer(i+1); - relu_layer_param->mutable_relu_param()->set_fuse(true); - // LOG(INFO) << "Bn + Relu fused." << std::endl; - } - } - } - } - - if(param.state().phase() == TEST) { - if (layers_to_drop.find(layer_param->name()) != layers_to_drop.end()) { - LOG_IF(INFO, Caffe::root_solver()) << "Dropped layer: " - << layer_param->name() << std::endl; - layer_included = false; - // Remove dropped layer from the list of layers to be dropped - layers_to_drop.erase(layers_to_drop.find(layer_param->name())); - } - } - - if (layer_included) { - param_compiled->add_layer()->CopyFrom(*layer_param); - } - } -} - template void Net::GetBlobConsumers( std::vector& consumer_blobs, diff --git a/src/caffe/proto/caffe.proto b/src/caffe/proto/caffe.proto index ea69365d7..439415c26 100755 --- a/src/caffe/proto/caffe.proto +++ b/src/caffe/proto/caffe.proto @@ -933,7 +933,6 @@ message BatchNormParameter { optional FillerParameter bias_filler = 8; // The filler for the bias // Batch size used for statistics, 0 would use the batch size of bottom blob optional uint32 stats_batch_size = 9 [default = 0]; - optional bool relu = 10 [default = false]; } message SplitParameter { From 694a1d7323e9944aefcf7c05af0569ecb9ce60b5 Mon Sep 17 00:00:00 2001 From: Haihao Shen Date: Fri, 22 Dec 2017 13:31:47 +0800 Subject: [PATCH 19/53] Enable performance monitor with event reset to avoid data variance during warmup iterations --- include/caffe/util/performance.hpp | 21 +++++++++++++++++++-- tools/caffe.cpp | 4 ++++ 2 files changed, 23 insertions(+), 2 deletions(-) diff --git a/include/caffe/util/performance.hpp b/include/caffe/util/performance.hpp index 9b9bd0657..28b3e512b 100644 --- a/include/caffe/util/performance.hpp +++ b/include/caffe/util/performance.hpp @@ -77,6 +77,12 @@ OF THIS SOFTWARE, EVEN IF ADVISED 
OF THE POSSIBILITY OF SUCH DAMAGE. performance::monitor.EnableMeasurements(); \ performance::monitor.MarkAsInitialized(); +#define PERFORMANCE_START_RESETTING_MONITOR() \ + performance::monitor.StartResetting(); + +#define PERFORMANCE_STOP_RESETTING_MONITOR() \ + performance::monitor.StopResetting(); + #define PERFORMANCE_MEASUREMENT_END_MKL(prefix) \ do { \ static char name[256]; \ @@ -117,6 +123,8 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #define PERFORMANCE_MEASUREMENT_END_ID(id_name) #define PERFORMANCE_CREATE_MONITOR() #define PERFORMANCE_INIT_MONITOR() +#define PERFORMANCE_START_RESETTING_MONITOR() +#define PERFORMANCE_STOP_RESETTING_MONITOR() #define PERFORMANCE_MEASUREMENT_END_MKL(prefix) #define PERFORMANCE_MEASUREMENT_END_MKL_DETAILED(prefix, suffix) #define PERFORMANCE_MKL_NAME_DETAILED(prefix, suffix) @@ -426,6 +434,7 @@ namespace performance { Map event_name_id_map_; bool are_measurements_enabled_; + bool resetting_; NameVector event_names_; PreciseTime total_non_mkl_time_; @@ -579,6 +588,7 @@ namespace performance { public: Monitor() { + resetting_ = false; events_.reserve(64); PreciseTime::Calibrate(); @@ -607,6 +617,9 @@ namespace performance { total_init_time_ = PreciseTime::GetProcessTime() - total_process_time_; } + void StartResetting() { resetting_ = true; } + void StopResetting() { resetting_ = false; } + unsigned GetEventIdByName(const char *event_name) { if (!are_measurements_enabled_) return PERFORMANCE_EVENT_ID_UNSET; @@ -622,8 +635,12 @@ namespace performance { } void UpdateEventById(unsigned event_id, const Measurement &measurement) { - if (are_measurements_enabled_) - events_[event_id].Update(measurement); + if (are_measurements_enabled_) { + if (resetting_) + events_[event_id] = Event(); + else + events_[event_id].Update(measurement); + } } }; diff --git a/tools/caffe.cpp b/tools/caffe.cpp index 0373794c3..8d78338d9 100644 --- a/tools/caffe.cpp +++ b/tools/caffe.cpp @@ -565,6 +565,8 @@ int time() { // have 
huge variance in some machines. int warmup_iterations = 5; for (int j = 0; j < warmup_iterations; ++j) { + if (j == warmup_iterations - 1) + PERFORMANCE_START_RESETTING_MONITOR(); for (int i = 0; i < layers.size(); ++i) { layers[i]->Forward(bottom_vecs[i], top_vecs[i]); } @@ -576,6 +578,8 @@ int time() { } } + PERFORMANCE_STOP_RESETTING_MONITOR(); + LOG(INFO) << "*** Benchmark begins ***"; LOG(INFO) << "Testing for " << FLAGS_iterations << " iterations."; Timer total_timer; From 5ae4cf4df2220893cc4d516df9d1044a9bc90074 Mon Sep 17 00:00:00 2001 From: fzou1 Date: Thu, 21 Dec 2017 18:35:07 +0800 Subject: [PATCH 20/53] add vgg16 topology files with 2k and 4k; fix crash issue of pycaffe; use last 2 virtual cores for internal thread, instead of reserving 2 physcial cores; support all cpu models for knl/skx/bdw and also support cpu model specified in command; change default multinode settings to bdw/skx (NO of MLSL ep server=2, run caffe binary directly if cpu is unknown" Change-Id: Ieb51e5fa9e5333d9834631fb53f81d3faccc1704 --- .../vgg_16_32nodes_2k_batch/solver.prototxt | 19 + .../train_val.prototxt | 613 ++++++++++++++++++ .../vgg_16_64nodes_4k_batch/solver.prototxt | 19 + .../train_val.prototxt | 613 ++++++++++++++++++ python/caffe/_caffe.cpp | 42 ++ scripts/run_benchmark.sh | 31 +- scripts/run_intelcaffe.sh | 69 +- scripts/set_env.sh | 21 +- 8 files changed, 1380 insertions(+), 47 deletions(-) create mode 100644 models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/solver.prototxt create mode 100644 models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/train_val.prototxt create mode 100644 models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/solver.prototxt create mode 100644 models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/train_val.prototxt diff --git a/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/solver.prototxt b/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/solver.prototxt new file 
mode 100644 index 000000000..e6ef942f4 --- /dev/null +++ b/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/solver.prototxt @@ -0,0 +1,19 @@ +net: "models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/train_val.prototxt" +test_iter: 1000 +test_interval: 1000 +momentum: 0.9 +weight_decay: 0.0005 +power: 2 +base_lr: 7 +warmup_start_lr: 1 +warmup_iter: 3127 # 5 epochs +local_lr_auto: true +local_gw_ratio: 0.001 + +lr_policy: "poly" +gamma: 0.1 +max_iter: 40000 +display: 20 +snapshot: 5000 +solver_mode: CPU +snapshot_prefix: "vgg_16_32nodes_2k_batch" diff --git a/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/train_val.prototxt b/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/train_val.prototxt new file mode 100644 index 000000000..046166772 --- /dev/null +++ b/models/intel_optimized_models/multinode/vgg_16_32nodes_2k_batch/train_val.prototxt @@ -0,0 +1,613 @@ +name: "VGG_ILSVRC_16_layer" +layer { + name: "data" + type: "Data" + include { + phase: TRAIN + } + transform_param { + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 124 + mirror: true + } + data_param { + source: "examples/imagenet/ilsvrc12_train_lmdb" + batch_size: 64 + backend: LMDB + shuffle: true + } + top: "data" + top: "label" +} +layer { + name: "data" + type: "Data" + include { + phase: TEST + } + transform_param { + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 124 + mirror: false + } + data_param { + source: "examples/imagenet/ilsvrc12_val_lmdb" + batch_size: 50 + backend: LMDB + } + top: "data" + top: "label" +} +layer { + name: "conv1_1" + type: "Convolution" + bottom: "data" + top: "conv1_1" + convolution_param { + + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv1_1" + top: "conv1_1" + name: "relu1_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv1_1" + top: "conv1_2" 
+ name: "conv1_2" + type: "Convolution" + convolution_param { + + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv1_2" + top: "conv1_2" + name: "relu1_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv1_2" + top: "pool1" + name: "pool1" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool1" + top: "conv2_1" + name: "conv2_1" + type: "Convolution" + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv2_1" + top: "conv2_1" + name: "relu2_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2_1" + top: "conv2_2" + name: "conv2_2" + type: "Convolution" + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv2_2" + top: "conv2_2" + name: "relu2_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2_2" + top: "pool2" + name: "pool2" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool2" + top: "conv3_1" + name: "conv3_1" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_1" + top: "conv3_1" + name: "relu3_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_1" + top: "conv3_2" + name: "conv3_2" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_2" + top: "conv3_2" + name: "relu3_2" + type: 
"ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_2" + top: "conv3_3" + name: "conv3_3" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_3" + top: "conv3_3" + name: "relu3_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_3" + top: "pool3" + name: "pool3" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool3" + top: "conv4_1" + name: "conv4_1" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_1" + top: "conv4_1" + name: "relu4_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_1" + top: "conv4_2" + name: "conv4_2" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_2" + top: "conv4_2" + name: "relu4_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_2" + top: "conv4_3" + name: "conv4_3" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_3" + top: "conv4_3" + name: "relu4_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_3" + top: "pool4" + name: "pool4" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool4" + top: "conv5_1" + name: "conv5_1" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + 
+} +layer { + bottom: "conv5_1" + top: "conv5_1" + name: "relu5_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_1" + top: "conv5_2" + name: "conv5_2" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv5_2" + top: "conv5_2" + name: "relu5_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_2" + top: "conv5_3" + name: "conv5_3" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.0 + } + } + + +} +layer { + bottom: "conv5_3" + top: "conv5_3" + name: "relu5_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_3" + top: "pool5" + name: "pool5" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool5" + top: "fc6" + name: "fc6" + type: "InnerProduct" + inner_product_param { + num_output: 4096 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + bottom: "fc6" + top: "fc6" + name: "relu6" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "fc6" + top: "fc6" + name: "drop6" + type: "Dropout" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + bottom: "fc6" + top: "fc7" + name: "fc7" + type: "InnerProduct" + inner_product_param { + num_output: 4096 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + bottom: "fc7" + top: "fc7" + name: "relu7" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "fc7" + top: "fc7" + name: "drop7" + type: "Dropout" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + name: "fc8" + bottom: "fc7" + top: "fc8" + type: "InnerProduct" + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + 
bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + name: "loss" + type: "SoftmaxWithLoss" + bottom: "fc8" + bottom: "label" + top: "loss/loss" +} +layer { + name: "accuracy/top1" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "accuracy@1" + include: { phase: TEST } + accuracy_param { + top_k: 1 + } +} +layer { + name: "accuracy/top5" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "accuracy@5" + include: { phase: TEST } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/solver.prototxt b/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/solver.prototxt new file mode 100644 index 000000000..23c27d292 --- /dev/null +++ b/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/solver.prototxt @@ -0,0 +1,19 @@ +net: "models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/train_val.prototxt" +test_iter: 1000 +test_interval: 1000 +momentum: 0.9 +weight_decay: 0.0005 +power: 2 +base_lr: 14 +warmup_start_lr: 1 +warmup_iter: 1564 # 5 epochs +local_lr_auto: true +local_gw_ratio: 0.001 + +lr_policy: "poly" +gamma: 0.1 +max_iter: 20000 +display: 20 +snapshot: 5000 +solver_mode: CPU +snapshot_prefix: "vgg_16_64nodes_4k_batch" diff --git a/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/train_val.prototxt b/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/train_val.prototxt new file mode 100644 index 000000000..046166772 --- /dev/null +++ b/models/intel_optimized_models/multinode/vgg_16_64nodes_4k_batch/train_val.prototxt @@ -0,0 +1,613 @@ +name: "VGG_ILSVRC_16_layer" +layer { + name: "data" + type: "Data" + include { + phase: TRAIN + } + transform_param { + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 124 + mirror: true + } + data_param { + source: "examples/imagenet/ilsvrc12_train_lmdb" + batch_size: 64 + backend: LMDB + shuffle: true + } + top: "data" + top: "label" +} +layer { + name: 
"data" + type: "Data" + include { + phase: TEST + } + transform_param { + crop_size: 224 + mean_value: 104 + mean_value: 117 + mean_value: 124 + mirror: false + } + data_param { + source: "examples/imagenet/ilsvrc12_val_lmdb" + batch_size: 50 + backend: LMDB + } + top: "data" + top: "label" +} +layer { + name: "conv1_1" + type: "Convolution" + bottom: "data" + top: "conv1_1" + convolution_param { + + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv1_1" + top: "conv1_1" + name: "relu1_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv1_1" + top: "conv1_2" + name: "conv1_2" + type: "Convolution" + convolution_param { + + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv1_2" + top: "conv1_2" + name: "relu1_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv1_2" + top: "pool1" + name: "pool1" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool1" + top: "conv2_1" + name: "conv2_1" + type: "Convolution" + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv2_1" + top: "conv2_1" + name: "relu2_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2_1" + top: "conv2_2" + name: "conv2_2" + type: "Convolution" + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv2_2" + top: "conv2_2" + name: "relu2_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2_2" + top: "pool2" + name: "pool2" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 
2 + } +} +layer { + bottom: "pool2" + top: "conv3_1" + name: "conv3_1" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_1" + top: "conv3_1" + name: "relu3_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_1" + top: "conv3_2" + name: "conv3_2" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_2" + top: "conv3_2" + name: "relu3_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_2" + top: "conv3_3" + name: "conv3_3" + type: "Convolution" + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv3_3" + top: "conv3_3" + name: "relu3_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv3_3" + top: "pool3" + name: "pool3" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool3" + top: "conv4_1" + name: "conv4_1" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_1" + top: "conv4_1" + name: "relu4_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_1" + top: "conv4_2" + name: "conv4_2" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_2" + top: "conv4_2" + name: "relu4_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_2" + top: "conv4_3" + name: "conv4_3" 
+ type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv4_3" + top: "conv4_3" + name: "relu4_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv4_3" + top: "pool4" + name: "pool4" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool4" + top: "conv5_1" + name: "conv5_1" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv5_1" + top: "conv5_1" + name: "relu5_1" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_1" + top: "conv5_2" + name: "conv5_2" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + + +} +layer { + bottom: "conv5_2" + top: "conv5_2" + name: "relu5_2" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_2" + top: "conv5_3" + name: "conv5_3" + type: "Convolution" + convolution_param { + + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.0 + } + } + + +} +layer { + bottom: "conv5_3" + top: "conv5_3" + name: "relu5_3" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv5_3" + top: "pool5" + name: "pool5" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + bottom: "pool5" + top: "fc6" + name: "fc6" + type: "InnerProduct" + inner_product_param { + num_output: 4096 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + bottom: "fc6" + top: "fc6" + name: "relu6" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "fc6" + 
top: "fc6" + name: "drop6" + type: "Dropout" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + bottom: "fc6" + top: "fc7" + name: "fc7" + type: "InnerProduct" + inner_product_param { + num_output: 4096 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + bottom: "fc7" + top: "fc7" + name: "relu7" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "fc7" + top: "fc7" + name: "drop7" + type: "Dropout" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + name: "fc8" + bottom: "fc7" + top: "fc8" + type: "InnerProduct" + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } + + +} +layer { + name: "loss" + type: "SoftmaxWithLoss" + bottom: "fc8" + bottom: "label" + top: "loss/loss" +} +layer { + name: "accuracy/top1" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "accuracy@1" + include: { phase: TEST } + accuracy_param { + top_k: 1 + } +} +layer { + name: "accuracy/top5" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "accuracy@5" + include: { phase: TEST } + accuracy_param { + top_k: 5 + } +} diff --git a/python/caffe/_caffe.cpp b/python/caffe/_caffe.cpp index afafe71d8..533c67295 100644 --- a/python/caffe/_caffe.cpp +++ b/python/caffe/_caffe.cpp @@ -57,6 +57,10 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. #include "caffe/layers/python_layer.hpp" #include "caffe/sgd_solvers.hpp" +#ifdef USE_MLSL +#include "caffe/multinode/mlsl.hpp" +#endif + // Temporary solution for numpy < 1.7 versions: old macro, no promises. // You're strongly advised to upgrade to >= 1.7. 
#ifndef NPY_ARRAY_C_CONTIGUOUS @@ -89,6 +93,37 @@ const int NPY_DTYPE = NPY_FLOAT32; void set_mode_cpu() { Caffe::set_mode(Caffe::CPU); } void set_mode_gpu() { Caffe::set_mode(Caffe::GPU); } +#ifdef USE_MLSL +void InitMultinode() { + int argc = 0; + char **argv = NULL; + mn::init(&argc, &argv); +} +#endif + +int NodeId() { +#if USE_MLSL + return mn::get_node_id(); +#else + return 0; +#endif +} + +int NumNodes() { +#if USE_MLSL + return mn::get_nodes_count(); +#else + return 1; +#endif +} + +void Barrier() { +#if USE_MLSL + mn::Distribution * distrib = mn::get_distrib(); + distrib->barrier(); +#endif +} + void InitLog() { ::google::InitGoogleLogging(""); ::google::InstallFailureSignalHandler(); @@ -344,6 +379,13 @@ BOOST_PYTHON_MODULE(_caffe) { bp::scope().attr("__version__") = AS_STRING(CAFFE_VERSION); +#ifdef USE_MLSL + InitMultinode(); +#endif + bp::def("_node_id", &NodeId); + bp::def("_num_nodes", &NumNodes); + bp::def("_barrier", &Barrier); + // Caffe utility functions bp::def("init_log", &InitLog); bp::def("init_log", &InitLogLevel); diff --git a/scripts/run_benchmark.sh b/scripts/run_benchmark.sh index c03fe50c3..9ee320236 100755 --- a/scripts/run_benchmark.sh +++ b/scripts/run_benchmark.sh @@ -90,20 +90,27 @@ function calculate_numnodes function detect_cpu { + # detect cpu model model_string=`lscpu | grep "Model name" | awk -F ':' '{print $2}'` - if [[ $model_string == *"7235"* ]] || [[ $model_string == *"7285"* ]] || [[ $model_string == *"7295"* ]]; then - cpu_model="knm" - elif [[ $model_string == *"72"* ]]; then - cpu_model="knl" - elif [[ $model_string == *"8180"* ]] || [[ $model_string == *"8124"* ]]; then - cpu_model="skx" - elif [[ $model_string == *"6148"* ]]; then - cpu_model="skx" - elif [[ $model_string == *"E5-26"* ]]; then - cpu_model="bdw" + if [[ $model_string == *"Phi"* ]]; then + if [[ $model_string =~ 72(1|3|5|9)0 ]]; then + cpu_model="knl" + elif [[ $model_string == *"72"* ]]; then + cpu_model="knm" + else + unknown_cpu=1 + echo "Can't 
detect which cpu model currently using, will use default settings, which may not be the optimal one." + fi else - unknown_cpu=1 - echo "Can't detect which cpu model currently using, will use default settings, which may not be the optimal one." + model_num=`echo $model_string | awk '{print $4}'` + if [[ $model_num =~ ^[8|6|5|4|3]1 ]]; then + cpu_model="skx" + elif [[ $model_num =~ ^E5-[4|2|1]6|^E7-[8|4]8|^E3-12|^D[-]?15 ]]; then + cpu_model="bdw" + else + unknown_cpu=1 + echo "Can't detect which cpu model currently using, will use default settings, which may not be the optimal one." + fi fi } diff --git a/scripts/run_intelcaffe.sh b/scripts/run_intelcaffe.sh index 27e90cef7..1761f6e92 100755 --- a/scripts/run_intelcaffe.sh +++ b/scripts/run_intelcaffe.sh @@ -10,7 +10,7 @@ numnodes=1 mode="train" # it's assigned by detect_cpu -cpu_model="skx" +cpu_model="" # a list of nodes host_file="" @@ -72,6 +72,7 @@ function usage echo " [--mpibench_bin mpibench_bin]" echo " [--mpibench_param mpibench_param]" echo " [--caffe_bin caffe_binary_path]" + echo " [--cpu cpu_model]" echo "" echo " Parameters:" echo " hostfile: host file includes list of nodes. Only used if you're running with multinode" @@ -93,30 +94,42 @@ function usage echo " mpibench_bin: IMB-MPI1 (default). relative path of binary of mpi benchmark." echo " mpibench_param: allreduce (default). parameter of mpi benchmark." echo " caffe_binary_path: path of caffe binary." + echo " cpu_model: specify cpu model and use the optimal settings if the CPU is not" + echo " included in supported list. Value: bdw, knl, skx and knm." + echo " bdw - Broadwell, knl - Knights Landing, skx - Skylake," + echo " knm - Knights Mill." 
echo "" } -declare -a cpu_list=("Intel Xeon E5-26xx (Broadwell)" "Intel Xeon Phi 72xx (Knights Landing)" - "Intel Xeon Platinum 8180 (Skylake)" "Intel Xeon 6148 (Skylake)") +declare -a cpu_list=("Intel Xeon E7-88/48xx, E5-46/26/16xx, E3-12xx, D15/D-15 (Broadwell)" + "Intel Xeon Phi 7210/30/50/90 (Knights Landing)" + "Intel Xeon Platinum 81/61/51/41/31xx (Skylake)") function detect_cpu { # detect cpu model model_string=`lscpu | grep "Model name" | awk -F ':' '{print $2}'` - if [[ $model_string == *"7235"* ]] || [[ $model_string == *"7285"* ]] || [[ $model_string == *"7295"* ]]; then - cpu_model="knm" - elif [[ $model_string == *"72"* ]]; then - cpu_model="knl" - elif [[ $model_string == *"8180"* ]] || [[ $model_string == *"8124"* ]]; then - cpu_model="skx" - elif [[ $model_string == *"6148"* ]]; then - cpu_model="skx" - elif [[ $model_string == *"E5-26"* ]]; then - cpu_model="bdw" + if [[ $model_string == *"Phi"* ]]; then + if [[ $model_string =~ 72(1|3|5|9)0 ]]; then + cpu_model="knl" + elif [[ $model_string == *"72"* ]]; then + cpu_model="knm" + else + cpu_model="unknown" + echo "CPU model :$model_string is unknown." + echo " Use default settings, which may not be the optimal one." + fi else - cpu_model="unknown" - echo "CPU model :$model_string is unknown." - echo " Use default settings, which may not be the optimal one." + model_num=`echo $model_string | awk '{print $4}'` + if [[ $model_num =~ ^[8|6|5|4|3]1 ]]; then + cpu_model="skx" + elif [[ $model_num =~ ^E5-[4|2|1]6|^E7-[8|4]8|^E3-12|^D[-]?15 ]]; then + cpu_model="bdw" + else + cpu_model="unknown" + echo "CPU model :$model_string is unknown." + echo " Use default settings, which may not be the optimal one." + fi fi } @@ -130,11 +143,11 @@ function set_numa_node # detect numa mode: cache and flat mode for KNL numa_node=($(numactl -H | grep "available" | awk -F ' ' '{print $2}')) if [ $numa_node -eq 1 ]; then - echo "Cache mode." + echo " NUMA configuration: Cache mode." 
# cache mode, use numa node 0 numanode=0 else - echo "Flat mode." + echo " NUMA configuration: Flat mode." numanode=1 fi } @@ -157,12 +170,12 @@ function execute_command local xeonbin_=$1 local result_dir_=$2 - if [ "${cpu_model}" == "bdw" ]; then - exec_command="$xeonbin_" - elif [ "${cpu_model}" == "skx" ]; then + if [ "${cpu_model}" == "skx" ]; then exec_command="numactl -l $xeonbin_" - else + elif [ "${cpu_model}" == "knl" ] || [ "${cpu_model}" == "knm" ]; then exec_command="numactl --preferred=$numanode $xeonbin_" + else + exec_command="$xeonbin_" fi if [ ${numnodes} -gt 1 ]; then @@ -487,6 +500,10 @@ do caffe_bin=$2 shift ;; + --cpu) + cpu_model=$2 + shift + ;; *) echo "Unknown option: $key" usage @@ -496,14 +513,18 @@ do shift done -detect_cpu - echo "" echo "CPUs with optimal settings:" for ((i=0; i<${#cpu_list[@]}; i++)) do echo " ${cpu_list[$i]}" done + +# if cpu model is not specified in command, detect cpu model by "lscpu" command +if [ "$cpu_model" == "" ]; then + detect_cpu +fi + echo "" echo "Settings:" echo " CPU: $cpu_model" diff --git a/scripts/set_env.sh b/scripts/set_env.sh index e2816aa5a..9d7ca6013 100755 --- a/scripts/set_env.sh +++ b/scripts/set_env.sh @@ -118,10 +118,10 @@ function set_mlsl_vars fi if [ ${num_mlsl_servers} -eq -1 ]; then - if [ "${cpu_model}" == "bdw" ] || [ "${cpu_model}" == "skx" ]; then - numservers=2 - else + if [ "${cpu_model}" == "knl" ] || [ "${cpu_model}" == "knm" ]; then numservers=4 + else + numservers=2 fi else numservers=$((num_mlsl_servers)) @@ -131,10 +131,10 @@ function set_mlsl_vars export MLSL_NUM_SERVERS=${numservers} if [ ${numservers} -gt 0 ]; then - if [ "${cpu_model}" == "bdw" ] || [ "${cpu_model}" == "skx" ]; then + if [ "${cpu_model}" == "knl" ] || [ "${cpu_model}" == "knm" ]; then listep=6,7,8,9 else - listep=6,7,8,9,10,11,12,13 + listep=6,7 fi export MLSL_SERVER_AFFINITY="${listep}" echo "MLSL_SERVER_AFFINITY: ${listep}" @@ -153,17 +153,16 @@ function set_openmp_envs ppncpu=1 threadspercore=1 + 
cpus=`lscpu | grep "^CPU(s):" | awk '{print $2}'` cores=`lscpu | grep "Core(s) per socket:" | awk '{print $4}'` sockets=`lscpu | grep "Socket(s)" | awk '{print $2}'` maxcores=$((cores*sockets)) if [ "$internal_thread_pin" == "on" ]; then - num_internal_threads=2 - export INTERNAL_THREADS_PIN=$((maxcores-2)),$((maxcores-1)) - else - num_internal_threads=0 + export INTERNAL_THREADS_PIN=$((cpus-2)),$((cpus-1)) + echo "Pin internal threads to: $INTERNAL_THREADS_PIN" fi - numthreads=$(((maxcores-numservers-num_internal_threads)*threadspercore)) + numthreads=$(((maxcores-numservers)*threadspercore)) numthreads_per_proc=$((numthreads/ppncpu)) # OMP configuration @@ -183,7 +182,7 @@ function set_openmp_envs export OMP_NUM_THREADS=${numthreads_per_proc} export KMP_HW_SUBSET=1t - affinitystr="proclist=[0-5,$((5+numservers+reserved_cores+1))-$((maxcores-1-num_internal_threads))],granularity=thread,explicit" + affinitystr="proclist=[0-5,$((5+numservers+reserved_cores+1))-$((maxcores-1))],granularity=thread,explicit" export KMP_AFFINITY=$affinitystr else # For single node only set for KNM From 5b6bbf7861372f05509bb26de11ca07208dfbba3 Mon Sep 17 00:00:00 2001 From: Feng Tian Date: Mon, 25 Dec 2017 10:52:05 +0800 Subject: [PATCH 21/53] Fix two issues existed in mkldnn conv and relue layers. 1. If mkldnn conv is followed by a caffe layer and conversion is needed, the problem will be triggered that the prv_data of bwdw_top_diff is pointing to a full 0 buffer as no conversion happened according to current logic. 2. If a caffe layer is before mkldnn relu layer, the problem will be triggered that the mkldnn bwd primitive is using bottom's cpu_data and top's prv_diff to do calculation. 
Change-Id: Ia1eb2a42c492603ce4f336ee09892c9bebe8687c --- include/caffe/layers/mkldnn_layers.hpp | 4 ++-- src/caffe/layers/mkldnn_convolution_layer.cpp | 9 ++++++++ .../layers/mkldnn_inner_product_layer.cpp | 8 +++++++ src/caffe/layers/mkldnn_relu_layer.cpp | 22 ++++++++++++++++++- src/caffe/mkldnn_memory.cpp | 2 +- 5 files changed, 41 insertions(+), 4 deletions(-) diff --git a/include/caffe/layers/mkldnn_layers.hpp b/include/caffe/layers/mkldnn_layers.hpp index 19bcee9da..cde342b30 100644 --- a/include/caffe/layers/mkldnn_layers.hpp +++ b/include/caffe/layers/mkldnn_layers.hpp @@ -387,13 +387,13 @@ class MKLDNNReLULayer : public MKLDNNLayer , public NeuronLayer { void InitReLUBwd(const vector*>& top, const vector& propagate_down , const vector*>& bottom); - shared_ptr > fwd_top_data, fwd_bottom_data; + shared_ptr > fwd_top_data, fwd_bottom_data, bwd_bottom_data; shared_ptr > bwd_top_diff, bwd_bottom_diff; shared_ptr reluFwd_pd; shared_ptr reluBwd_pd; MKLDNNPrimitive reluFwd, reluBwd; shared_ptr fwd_top_data_memory, bwd_bottom_diff_memory; - shared_ptr fwd_bottom_data_primitive, bwd_top_diff_primitive; + shared_ptr fwd_bottom_data_primitive, bwd_top_diff_primitive, bwd_bottom_data_primitive; int32_t num_, width_, height_, channels_; PERFORMANCE_EVENT_ID_DECL(perf_id_fw_); diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index 1ac34b5fb..991b32eb7 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -578,6 +578,8 @@ void MKLDNNConvolutionLayer::Backward_cpu(const vector*>& top , const vector*>& bottom) { VLOG(1) << "MKLDNNConvolutionLayer::Backward_cpu: " << this->layer_param_.name(); + bool top_diff_is_prv = (const_cast(top[0]->prv_diff()) != NULL); + if( convBwdData_pd == NULL || this->reshape) InitConvolutionBwd(top, propagate_down, bottom); if (propagate_down[0]) { @@ -636,6 +638,13 @@ void MKLDNNConvolutionLayer::Backward_cpu(const vector*>& top 
PERFORMANCE_MEASUREMENT_END_ID(perf_id_bw_); } if (this->param_propagate_down(0)) { + // We have to sync top diff to cpu explicitly. This is used to make + // bwdw_top_diff->sync_before_read() have chance to get coverted data as + // bwdd_top_diff->sync_before_read() have updated top diff's prv_data + // to self. This issue only happens when MKLDNN conv layer is followed + // by a CAFFE layer and conversion is needed. + if (!top_diff_is_prv && propagate_down[0]) + top[0]->mutable_cpu_diff(); // making reorders if needed. bwdw_top_diff->sync_before_read(); bwdw_bottom_data->sync_before_read(); diff --git a/src/caffe/layers/mkldnn_inner_product_layer.cpp b/src/caffe/layers/mkldnn_inner_product_layer.cpp index 1c7def27d..7c48547b6 100644 --- a/src/caffe/layers/mkldnn_inner_product_layer.cpp +++ b/src/caffe/layers/mkldnn_inner_product_layer.cpp @@ -530,6 +530,7 @@ void MKLDNNInnerProductLayer::Backward_cpu(const vector*>& to #ifdef DEBUG LOG(INFO) << "MKLDNNInnerProductLayer::Backward_cpu: " << this->layer_param_.name(); #endif + bool top_diff_is_prv = (const_cast(top[0]->prv_diff()) != NULL); if( ipBwdData_pd == NULL || this->reshape) InitInnerProductBwd(top, propagate_down, bottom); @@ -590,6 +591,13 @@ void MKLDNNInnerProductLayer::Backward_cpu(const vector*>& to PERFORMANCE_MEASUREMENT_END_ID(perf_id_bw_); } if (this->param_propagate_down(0)) { + // We have to sync top diff to cpu explicitly. This is used to make + // bwdw_top_diff->sync_before_read() have chance to get coverted data as + // bwdd_top_diff->sync_before_read() have updated top diff's prv_data + // to self. This issue only happens when MKLDNN innerproduct layer is + // followed by a CAFFE layer and conversion is needed. + if (!top_diff_is_prv && propagate_down[0]) + top[0]->mutable_cpu_diff(); // making reorders if needed. 
bwdw_top_diff->sync_before_read(); bwdw_bottom_data->sync_before_read(); diff --git a/src/caffe/layers/mkldnn_relu_layer.cpp b/src/caffe/layers/mkldnn_relu_layer.cpp index e21b24a5c..364063f12 100644 --- a/src/caffe/layers/mkldnn_relu_layer.cpp +++ b/src/caffe/layers/mkldnn_relu_layer.cpp @@ -203,6 +203,21 @@ void MKLDNNReLULayer::InitReLUBwd(const vector*>& top shared_ptr usr_diff_mpd = NULL; shared_ptr prv_diff_mpd = NULL; + bool bottom_data_is_prv = (const_cast(bottom[0]->prv_data()) != NULL); + + // ---- Initialize memory descriptors ------------- + shared_ptr bottom_data_md; + shared_ptr usr_data_mpd(NULL), prv_data_mpd(NULL); + if (bottom_data_is_prv) { + shared_ptr > mem_descr + = get_mkldnn_prv_descriptor(bottom[0]); + usr_data_mpd = mem_descr->usr_memory_pd(); + prv_data_mpd = mem_descr->prv_memory_pd(); + } else { + bottom_data_md.reset(new memory::desc({{n, ic, ih, iw}}, mpcsn, memory::format::nchw)); + usr_data_mpd.reset(new memory::primitive_desc(*bottom_data_md, cpu_engine)); + } + if (top_diff_is_prv) { shared_ptr > mem_descr = get_mkldnn_prv_descriptor(top[0]); @@ -286,11 +301,15 @@ void MKLDNNReLULayer::InitReLUBwd(const vector*>& top bwd_top_diff->name = "bwd_top_diff_data @ " + this->layer_param_.name(); bwd_top_diff_primitive = bwd_top_diff->create_input(/* set_prv_ptr */ false); + bwd_bottom_data.reset(new MKLDNNData(usr_data_mpd, prv_data_mpd, bottom[0], this)); + bwd_bottom_data->name = "bwd_bottom_data @ " + this->layer_param_.name(); + bwd_bottom_data_primitive = bwd_bottom_data->create_input(/* set_prv_ptr */ false); + bwd_bottom_diff.reset(new MKLDNNDiff(usr_diff_mpd, prv_diff_mpd, bottom[0], this)); bwd_bottom_diff->name = "bwd_bottom_diff_data @ " + this->layer_param_.name(); bwd_bottom_diff_memory = bwd_bottom_diff->create_output_memory(inplace); - reluBwd.reset(new relu_backward(*reluBwd_pd, *fwd_bottom_data_primitive, *bwd_top_diff_primitive, *bwd_bottom_diff_memory)); + reluBwd.reset(new relu_backward(*reluBwd_pd, 
*bwd_bottom_data_primitive, *bwd_top_diff_primitive, *bwd_bottom_diff_memory)); //bwd_top_diff->set_mkldnn_primitive(reluBwd); //Wrong passed primitive! (TODO: Checking!) MKLDNNPrimitive bwd_top_diff_primitive_transfer(bwd_top_diff_primitive); bwd_top_diff->set_mkldnn_primitive(bwd_top_diff_primitive_transfer); @@ -319,6 +338,7 @@ void MKLDNNReLULayer::Backward_cpu(const vector*>& top } bwd_top_diff->sync_before_read(); + bwd_bottom_data->sync_before_read(); //For MKLDNN, it always create two memory for input and output //For Intel Caffe, if we set the inplace flag to true, input and output will use one same buffer //Then the update of output will not pass to MKLDNN diff --git a/src/caffe/mkldnn_memory.cpp b/src/caffe/mkldnn_memory.cpp index 13691c4bb..9601e41ee 100644 --- a/src/caffe/mkldnn_memory.cpp +++ b/src/caffe/mkldnn_memory.cpp @@ -323,7 +323,7 @@ void MKLDNNMemoryDescriptor::sync_before_read() this->convert_to_prv(const_cast(is_diff ? this->_blob->cpu_diff() : this->_blob->cpu_data())); // if blob has not prv descriptor then set it to avoid conversions on next iterations if (is_diff) { - this->_blob->set_prv_diff_descriptor(this->get_shared_ptr(), false); + this->_blob->set_prv_diff_descriptor(this->get_shared_ptr(), true); // Original: // below line designated to set correspondent SyncedMemory->_head to HEAD_AT_CPU // TODO: need to optimize From 3823cb3c716119721fe31a50ed464246821ca95a Mon Sep 17 00:00:00 2001 From: "Yu, Chong" Date: Mon, 25 Dec 2017 19:04:27 +0800 Subject: [PATCH 22/53] Roll the MKLDNN version back to aab753280e to avoid performance regression. 
--- mkldnn.commit | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mkldnn.commit b/mkldnn.commit index ed29e5f9d..49f70144e 100644 --- a/mkldnn.commit +++ b/mkldnn.commit @@ -1 +1 @@ -82cf37f626a0998d38f99c30e5a08a0dd5e49bc0 \ No newline at end of file +aab753280e83137ba955f8f19d72cb6aaba545ef \ No newline at end of file From 06383c1c2c07ba211969fbadd3b4b129fa8edde1 Mon Sep 17 00:00:00 2001 From: fzou1 Date: Tue, 26 Dec 2017 11:12:36 +0800 Subject: [PATCH 23/53] fix build issue of latest mkldnn --- Makefile | 3 +++ 1 file changed, 3 insertions(+) diff --git a/Makefile b/Makefile index 10a10a1d9..2f488be0c 100644 --- a/Makefile +++ b/Makefile @@ -336,6 +336,9 @@ endif ifdef CUSTOM_CXX CXX := $(CUSTOM_CXX) endif +ifdef CUSTOM_CC + CC := $(CUSTOM_CC) +endif # Linux ifeq ($(LINUX), 1) From 141827eff1b1c7dd28e97f9d855508d991feb77d Mon Sep 17 00:00:00 2001 From: fzou1 Date: Tue, 26 Dec 2017 15:06:05 +0800 Subject: [PATCH 24/53] move layer timing macro out of USE_MLSL macro as it can be used for single node performance measurement, and fix compilation issues --- Makefile | 7 +++---- cmake/Dependencies.cmake | 7 ++++--- src/caffe/net.cpp | 2 +- src/caffe/solver.cpp | 2 ++ 4 files changed, 10 insertions(+), 8 deletions(-) diff --git a/Makefile b/Makefile index 2f488be0c..03df628e4 100644 --- a/Makefile +++ b/Makefile @@ -60,6 +60,9 @@ else OTHER_BUILD_DIR := $(DEBUG_BUILD_DIR) endif +ifeq ($(CAFFE_PER_LAYER_TIMINGS), 1) + COMMON_FLAGS += -DCAFFE_PER_LAYER_TIMINGS +endif #################### MLSL #################### @@ -79,10 +82,6 @@ endif IGNORE := $(shell bash -c "source $(MLSL_ROOT)/intel64/bin/mlslvars.sh; env | sed 's/=/:=/' | sed 's/^/export /' > make_mlsl_env") include make_mlsl_env -ifeq ($(CAFFE_PER_LAYER_TIMINGS), 1) - COMMON_FLAGS += -DCAFFE_PER_LAYER_TIMINGS -endif - ifeq ($(CAFFE_MLSL_SHUFFLE), 1) COMMON_FLAGS += -DCAFFE_MLSL_SHUFFLE endif diff --git a/cmake/Dependencies.cmake b/cmake/Dependencies.cmake index bd0127afc..08738b6c2 100644 --- 
a/cmake/Dependencies.cmake +++ b/cmake/Dependencies.cmake @@ -94,6 +94,10 @@ if(USE_OPENCV) add_definitions(-DUSE_OPENCV) endif() +if(CAFFE_PER_LAYER_TIMINGS) + add_definitions("-DCAFFE_PER_LAYER_TIMINGS") +endif() + # ---[ MLSL if(USE_MLSL) if (NOT CPU_ONLY) @@ -120,9 +124,6 @@ if(USE_MLSL) link_directories(SYSTEM "${MLSL_ROOT}/intel64/lib") list(APPEND Caffe_LINKER_LIBS mlsl) - if(CAFFE_PER_LAYER_TIMINGS) - add_definitions("-DCAFFE_PER_LAYER_TIMINGS") - endif() if(CAFFE_MLSL_SHUFFLE) add_definitions("-DCAFFE_MLSL_SHUFFLE") endif() diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 49e35f699..dd0fa03cf 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -2033,8 +2033,8 @@ void Net::PrintTimers(bool printTotal) { startcomm_time_per_layer_total : startcomm_time_per_layer; std::vector& waitcomm_timers = printTotal ? waitcomm_time_per_layer_total : waitcomm_time_per_layer; - std::string prefix = printTotal ? "TOTAL " : "DELTA "; #endif + std::string prefix = printTotal ? "TOTAL " : "DELTA "; double forward_time = std::accumulate(forward_timers.begin(), forward_timers.end(), 0.0) / 1000.0; diff --git a/src/caffe/solver.cpp b/src/caffe/solver.cpp index aad9e3596..2b47b0b2e 100644 --- a/src/caffe/solver.cpp +++ b/src/caffe/solver.cpp @@ -357,7 +357,9 @@ void Solver::Step(int iters) { net_->PrintTimers(false); net_->ResetTimers(); +#ifdef USE_MLSL if (mn::get_node_id() == 0) +#endif LOG(INFO) << "iter " << iter_ << ", forward_backward_update_time: " << iter_time << " ms"; #endif From f32f4d12ccdc49492095d8218aefa4b70ea0502c Mon Sep 17 00:00:00 2001 From: "Yu, Chong" Date: Tue, 26 Dec 2017 15:08:17 +0800 Subject: [PATCH 25/53] Fix the ASSERT '0' FAILED: specify MLSL_ROOT in CMake process. 
--- cmake/Dependencies.cmake | 1 + src/caffe/net.cpp | 10 ++++++++++ 2 files changed, 11 insertions(+) diff --git a/cmake/Dependencies.cmake b/cmake/Dependencies.cmake index 08738b6c2..c01daa1a3 100644 --- a/cmake/Dependencies.cmake +++ b/cmake/Dependencies.cmake @@ -120,6 +120,7 @@ if(USE_MLSL) endif() message(STATUS "Machine Learning Scaling Library (MLSL) found (${MLSL_ROOT}/intel64)") add_definitions("-DUSE_MLSL=1") + add_definitions("-DFOUNDED_MLSL_ROOT=${MLSL_ROOT}") include_directories(SYSTEM "${MLSL_ROOT}/intel64/include") link_directories(SYSTEM "${MLSL_ROOT}/intel64/lib") list(APPEND Caffe_LINKER_LIBS mlsl) diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index dd0fa03cf..2118394ec 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -2249,3 +2249,13 @@ void Net::PrintPayloadSize() { INSTANTIATE_CLASS(Net); } // namespace caffe + +#if defined(FOUNDED_MLSL_ROOT) +#define DEF_MLSL(str) \ +const char *mlsl_root = #str; + +__attribute__((constructor)) void lib_ctor() { + DEF_MLSL(FOUNDED_MLSL_ROOT); + setenv("MLSL_ROOT", mlsl_root, 0); +} +#endif From 6397ea38d511adf5aad856c728339e73bae91e22 Mon Sep 17 00:00:00 2001 From: "Yu, Chong" Date: Tue, 26 Dec 2017 22:49:15 +0800 Subject: [PATCH 26/53] Fix error while loading shared libraries libmlsl.so.1 in make process. 
--- Makefile | 17 ++++++++--------- 1 file changed, 8 insertions(+), 9 deletions(-) diff --git a/Makefile b/Makefile index 03df628e4..a710983d4 100644 --- a/Makefile +++ b/Makefile @@ -74,13 +74,12 @@ endif RETURN_STRING=$(shell ./external/mlsl/prepare_mlsl.sh) MLSL_ROOT=$(firstword $(RETURN_STRING)) - MLSL_LDFLAGS=$(lastword $(RETURN_STRING)) + MLSL_LDFLAGS:=-lmpi -l$(lastword $(RETURN_STRING)) -Wl,-rpath,$(MLSL_ROOT)/intel64/lib COMMON_FLAGS += -DUSE_MLSL=1 - LIBRARIES += mlsl + LIBRARIES += mlsl mpi INCLUDE_DIRS += $(MLSL_ROOT)/intel64/include LIBRARY_DIRS += $(MLSL_ROOT)/intel64/lib - IGNORE := $(shell bash -c "source $(MLSL_ROOT)/intel64/bin/mlslvars.sh; env | sed 's/=/:=/' | sed 's/^/export /' > make_mlsl_env") - include make_mlsl_env + COMMON_FLAGS += -DFOUNDED_MLSL_ROOT=$(MLSL_ROOT) ifeq ($(CAFFE_MLSL_SHUFFLE), 1) COMMON_FLAGS += -DCAFFE_MLSL_SHUFFLE @@ -779,7 +778,7 @@ $(ALL_BUILD_DIRS): | $(BUILD_DIR_LINK) $(DYNAMIC_NAME): $(OBJS) | $(LIB_BUILD_DIR) @ echo LD -o $@ - $(Q)$(CXX) -shared -o $@ $(OBJS) $(VERSIONFLAGS) $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_SHARED_HARDENING_FLAGS) $(LDFLAGS) + $(Q)$(CXX) -shared -o $@ $(OBJS) $(VERSIONFLAGS) $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MLSL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_SHARED_HARDENING_FLAGS) $(LDFLAGS) @ cd $(BUILD_DIR)/lib; rm -f $(DYNAMIC_NAME_SHORT); ln -s $(DYNAMIC_VERSIONED_NAME_SHORT) $(DYNAMIC_NAME_SHORT) $(STATIC_NAME): $(OBJS) | $(LIB_BUILD_DIR) @@ -811,7 +810,7 @@ $(TEST_ALL_BIN): $(TEST_MAIN_SRC) $(TEST_OBJS) $(GTEST_OBJS) \ | $(DYNAMIC_NAME) $(TEST_BIN_DIR) @ echo CXX/LD -o $@ $< $(Q)$(CXX) -std=c++11 $(TEST_MAIN_SRC) $(TEST_OBJS) $(GTEST_OBJS) \ - -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) $(LDFLAGS) -l$(LIBRARY_NAME) -Wl,-rpath,$(ORIGIN)/../lib + -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) 
$(MKL_LDFLAGS) $(MLSL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) $(LDFLAGS) -l$(LIBRARY_NAME) -Wl,-rpath,$(ORIGIN)/../lib $(TEST_CU_BINS): $(TEST_BIN_DIR)/%.testbin: $(TEST_CU_BUILD_DIR)/%.o \ $(GTEST_OBJS) | $(DYNAMIC_NAME) $(TEST_BIN_DIR) @@ -823,7 +822,7 @@ $(TEST_CXX_BINS): $(TEST_BIN_DIR)/%.testbin: $(TEST_CXX_BUILD_DIR)/%.o \ $(GTEST_OBJS) | $(DYNAMIC_NAME) $(TEST_BIN_DIR) @ echo LD $< $(Q)$(CXX) -std=c++11 $(TEST_MAIN_SRC) $< $(GTEST_OBJS) \ - -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) $(LDFLAGS) -l$(LIBRARY_NAME) -Wl,-rpath,$(ORIGIN)/../lib + -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MLSL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) $(LDFLAGS) -l$(LIBRARY_NAME) -Wl,-rpath,$(ORIGIN)/../lib # Target for extension-less symlinks to tool binaries with extension '*.bin'. $(TOOL_BUILD_DIR)/%: $(TOOL_BUILD_DIR)/%.bin | $(TOOL_BUILD_DIR) @@ -832,12 +831,12 @@ $(TOOL_BUILD_DIR)/%: $(TOOL_BUILD_DIR)/%.bin | $(TOOL_BUILD_DIR) $(TOOL_BINS): %.bin : %.o | $(DYNAMIC_NAME) @ echo CXX/LD -o $@ - $(Q)$(CXX) $< -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) -l$(LIBRARY_NAME) $(LDFLAGS) \ + $(Q)$(CXX) $< -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MLSL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) -l$(LIBRARY_NAME) $(LDFLAGS) \ -Wl,-rpath,$(ORIGIN)/../lib $(EXAMPLE_BINS): %.bin : %.o | $(DYNAMIC_NAME) @ echo CXX/LD -o $@ - $(Q)$(CXX) $< -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) $(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) -l$(LIBRARY_NAME) $(LDFLAGS) \ + $(Q)$(CXX) $< -o $@ $(BOOST_LDFLAGS) $(LINKFLAGS) $(MKL_LDFLAGS) $(MLSL_LDFLAGS) $(MKLDNN_LDFLAGS) $(DLCP_LDFLAGS) 
$(CXX_HARDENING_FLAGS) $(LINKER_EXEC_HARDENING_FLAGS) -l$(LIBRARY_NAME) $(LDFLAGS) \ -Wl,-rpath,$(ORIGIN)/../../lib proto: $(PROTO_GEN_CC) $(PROTO_GEN_HEADER) From 6cc851dcc8e8c550a3c343670c776005fccdaba8 Mon Sep 17 00:00:00 2001 From: Feng Tian Date: Wed, 27 Dec 2017 11:20:42 +0800 Subject: [PATCH 27/53] set CPU_ONLY to ON by default in CMAKE build --- CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index 5a700f273..8ab712cf7 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -26,7 +26,7 @@ include(cmake/Summary.cmake) include(cmake/ConfigGen.cmake) # ---[ Options -caffe_option(CPU_ONLY "Build Caffe without CUDA support" OFF) # TODO: rename to USE_CUDA +caffe_option(CPU_ONLY "Build Caffe without CUDA support" ON) # TODO: rename to USE_CUDA caffe_option(USE_OPENMP "Build Caffe with OpenMP support" ON ) caffe_option(USE_CUDNN "Build Caffe with cuDNN library support" ON IF NOT CPU_ONLY) caffe_option(USE_MKL2017_AS_DEFAULT_ENGINE "Use MKL2017 primitives for supported layers" OFF) From 0e6b69cbf140300848a55fbe89e51d8fa85a2a3f Mon Sep 17 00:00:00 2001 From: Feng Tian Date: Wed, 27 Dec 2017 15:25:54 +0800 Subject: [PATCH 28/53] update SSD topologies to use pure MKLDNN engine. 
--- .../ssd/AlexNet/VOC0712/SSD_300x300/deploy.prototxt | 3 --- .../ssd/AlexNet/VOC0712/SSD_300x300/test.prototxt | 3 --- .../ssd/AlexNet/VOC0712/SSD_300x300/train.prototxt | 3 --- .../ssd/VGGNet/VOC0712/SSD_300x300/deploy.prototxt | 3 --- .../ssd/VGGNet/VOC0712/SSD_300x300/test.prototxt | 3 --- .../ssd/VGGNet/VOC0712/SSD_300x300/train.prototxt | 3 --- .../ssd/VGGNet/VOC0712/SSD_300x300_webcam/test.prototxt | 3 --- .../ssd/VGGNet/coco/SSD_300x300/deploy.prototxt | 3 --- .../ssd/VGGNet/coco/SSD_300x300/test.prototxt | 3 --- .../ssd/VGGNet/coco/SSD_300x300/train.prototxt | 3 --- .../ssd/VGGNet/coco/SSD_300x300_webcam/test.prototxt | 3 --- 11 files changed, 33 deletions(-) diff --git a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/deploy.prototxt b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/deploy.prototxt index d37915e26..658dda5c9 100644 --- a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/deploy.prototxt +++ b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/deploy.prototxt @@ -1326,7 +1326,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1341,7 +1340,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1356,7 +1354,6 @@ layer { concat_param { axis: 2 } - engine: "CAFFE" } layer { name: "mbox_conf_reshape" diff --git a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/test.prototxt b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/test.prototxt index 0eac716a0..167b34ab3 100644 --- a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/test.prototxt +++ b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/test.prototxt @@ -1350,7 +1350,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1365,7 +1364,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1380,7 +1378,6 @@ layer { concat_param { axis: 2 } - 
engine: "CAFFE" } layer { name: "mbox_conf_reshape" diff --git a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/train.prototxt b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/train.prototxt index d8bac9b7f..1f82b813f 100644 --- a/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/train.prototxt +++ b/models/intel_optimized_models/ssd/AlexNet/VOC0712/SSD_300x300/train.prototxt @@ -1455,7 +1455,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1470,7 +1469,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1485,7 +1483,6 @@ layer { concat_param { axis: 2 } - engine: "CAFFE" } layer { name: "mbox_loss" diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy.prototxt index dfe14b516..733229e89 100644 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/deploy.prototxt @@ -1535,7 +1535,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1550,7 +1549,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1565,7 +1563,6 @@ layer { concat_param { axis: 2 } - engine: "CAFFE" } layer { name: "mbox_conf_reshape" diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/test.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/test.prototxt index 38152e56a..a9d4e83a9 100644 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/test.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/test.prototxt @@ -1559,7 +1559,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1574,7 +1573,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1589,7 +1587,6 
@@ layer { concat_param { axis: 2 } - engine: "CAFFE" } layer { name: "mbox_conf_reshape" diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train.prototxt index 451a5bad9..ee6685520 100644 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300/train.prototxt @@ -1664,7 +1664,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_conf" @@ -1679,7 +1678,6 @@ layer { concat_param { axis: 1 } - engine: "CAFFE" } layer { name: "mbox_priorbox" @@ -1694,7 +1692,6 @@ layer { concat_param { axis: 2 } - engine: "CAFFE" } layer { name: "mbox_loss" diff --git a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300_webcam/test.prototxt b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300_webcam/test.prototxt index eaff4c56e..720ffd850 100644 --- a/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300_webcam/test.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/VOC0712/SSD_300x300_webcam/test.prototxt @@ -1552,7 +1552,6 @@ layer { top: "mbox_loc" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1567,7 +1566,6 @@ layer { top: "mbox_conf" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1582,7 +1580,6 @@ layer { top: "mbox_priorbox" concat_param { axis: 2 - engine: CAFFE } } layer { diff --git a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/deploy.prototxt b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/deploy.prototxt index fb56a59f1..1ae54d997 100644 --- a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/deploy.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/deploy.prototxt @@ -1534,7 +1534,6 @@ layer { top: "mbox_loc" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1549,7 +1548,6 @@ layer { top: "mbox_conf" concat_param { axis: 1 - engine: CAFFE } } layer { 
@@ -1564,7 +1562,6 @@ layer { top: "mbox_priorbox" concat_param { axis: 2 - engine: CAFFE } } layer { diff --git a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/test.prototxt b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/test.prototxt index 97e83c7f0..4d8704801 100644 --- a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/test.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/test.prototxt @@ -1559,7 +1559,6 @@ layer { top: "mbox_loc" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1574,7 +1573,6 @@ layer { top: "mbox_conf" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1589,7 +1587,6 @@ layer { top: "mbox_priorbox" concat_param { axis: 2 - engine: CAFFE } } layer { diff --git a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/train.prototxt b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/train.prototxt index ef92f1da9..698e0f669 100644 --- a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/train.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300/train.prototxt @@ -1664,7 +1664,6 @@ layer { top: "mbox_loc" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1679,7 +1678,6 @@ layer { top: "mbox_conf" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1694,7 +1692,6 @@ layer { top: "mbox_priorbox" concat_param { axis: 2 - engine: CAFFE } } layer { diff --git a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300_webcam/test.prototxt b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300_webcam/test.prototxt index c78dcccb3..4c9a9db88 100644 --- a/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300_webcam/test.prototxt +++ b/models/intel_optimized_models/ssd/VGGNet/coco/SSD_300x300_webcam/test.prototxt @@ -1552,7 +1552,6 @@ layer { top: "mbox_loc" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1567,7 +1566,6 @@ layer { top: "mbox_conf" concat_param { axis: 1 - engine: CAFFE } } layer { @@ -1582,7 +1580,6 @@ layer { 
top: "mbox_priorbox" concat_param { axis: 2 - engine: CAFFE } } layer { From fb26b339fdfbd55b194239291d12a24c828b2354 Mon Sep 17 00:00:00 2001 From: Haihao Shen Date: Thu, 28 Dec 2017 01:54:25 +0800 Subject: [PATCH 29/53] Fix label smoothing using right math utility functions --- src/caffe/layers/softmax_loss_layer.cpp | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/src/caffe/layers/softmax_loss_layer.cpp b/src/caffe/layers/softmax_loss_layer.cpp index 1ac0cf6b8..b9e3fc3b8 100644 --- a/src/caffe/layers/softmax_loss_layer.cpp +++ b/src/caffe/layers/softmax_loss_layer.cpp @@ -226,7 +226,8 @@ void SoftmaxWithLossLayer::Backward_cpu(const vector*>& top, ratio = (alpha + (dim - 1) * beta); // for label true, alpha - yi (alpha + (N-1) * beta) // for label false, beta - yj (alpha + (N-1) * beta) - caffe_cpu_axpby(bottom[0]->count(), Dtype(ratio), bottom_diff, Dtype(-beta), bottom_diff); + caffe_scal(bottom[0]->count(), Dtype(ratio), bottom_diff); + caffe_add_scalar(bottom[0]->count(), Dtype(-beta), bottom_diff); } Dtype weight_sum = Dtype(0); const Dtype* weights = bottom[2]->cpu_data(); @@ -263,7 +264,8 @@ void SoftmaxWithLossLayer::Backward_cpu(const vector*>& top, ratio = (alpha + (dim - 1) * beta); // for label true, alpha - yi (alpha + (N-1) * beta) // for label false, beta - yj (alpha + (N-1) * beta) - caffe_cpu_axpby(bottom[0]->count(), Dtype(ratio), bottom_diff, Dtype(-beta), bottom_diff); + caffe_scal(bottom[0]->count(), Dtype(ratio), bottom_diff); + caffe_add_scalar(bottom[0]->count(), Dtype(-beta), bottom_diff); } int count = 0; for (int i = 0; i < outer_num_; ++i) { From 6df7362cc1ec1798f183e14efc012e55ffd3b58d Mon Sep 17 00:00:00 2001 From: fzou1 Date: Tue, 2 Jan 2018 09:50:03 +0800 Subject: [PATCH 30/53] move layer timing flag out of multinode flag in build script --- scripts/build_intelcaffe.sh | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/scripts/build_intelcaffe.sh b/scripts/build_intelcaffe.sh 
index 168d04fc3..a29da73dc 100755 --- a/scripts/build_intelcaffe.sh +++ b/scripts/build_intelcaffe.sh @@ -41,9 +41,6 @@ function build_caffe_gcc if [ $is_multinode_ -eq 1 ]; then echo "USE_MLSL := 1" >> Makefile.config - if [ $is_layer_timing -eq 1 ]; then - echo "CAFFE_PER_LAYER_TIMINGS := 1" >> Makefile.config - fi mlslvars_sh=`find external/mlsl/ -name mlslvars.sh` if [ -f $mlslvars_sh ]; then @@ -51,6 +48,10 @@ function build_caffe_gcc fi fi + if [ $is_layer_timing -eq 1 ]; then + echo "CAFFE_PER_LAYER_TIMINGS := 1" >> Makefile.config + fi + if [ $debug -eq 1 ]; then echo "DEBUG := 1" >> Makefile.config fi @@ -100,9 +101,10 @@ function build_caffe_icc cmake_params="-DCPU_ONLY=1 -DBOOST_ROOT=$boost_root" if [ $is_multinode_ -eq 1 ]; then cmake_params+=" -DUSE_MLSL=1" - if [ $is_layer_timing -eq 1 ]; then - cmake_params+=" -DCAFFE_PER_LAYER_TIMINGS=1" - fi + fi + + if [ $is_layer_timing -eq 1 ]; then + cmake_params+=" -DCAFFE_PER_LAYER_TIMINGS=1" fi if [ $debug -eq 1 ]; then From f2c8795aea00c8c88dc5b293c099b56a2675958b Mon Sep 17 00:00:00 2001 From: Feng Tian Date: Tue, 2 Jan 2018 10:53:48 +0800 Subject: [PATCH 31/53] sync LiuWei's SSD sampling bug fix 96175b to intel caffe --- src/caffe/util/sampler.cpp | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/caffe/util/sampler.cpp b/src/caffe/util/sampler.cpp index f47a78dd8..b4fc44830 100644 --- a/src/caffe/util/sampler.cpp +++ b/src/caffe/util/sampler.cpp @@ -133,11 +133,11 @@ void SampleBBox(const Sampler& sampler, NormalizedBBox* sampled_bbox) { CHECK_GT(sampler.min_aspect_ratio(), 0.); CHECK_LT(sampler.max_aspect_ratio(), FLT_MAX); float aspect_ratio; - float min_aspect_ratio = std::max(sampler.min_aspect_ratio(), - std::pow(scale, 2.)); - float max_aspect_ratio = std::min(sampler.max_aspect_ratio(), - 1 / std::pow(scale, 2.)); - caffe_rng_uniform(1, min_aspect_ratio, max_aspect_ratio, &aspect_ratio); + caffe_rng_uniform(1, sampler.min_aspect_ratio(), sampler.max_aspect_ratio(), + 
&aspect_ratio); + + aspect_ratio = std::max(aspect_ratio, std::pow(scale, 2.)); + aspect_ratio = std::min(aspect_ratio, 1 / std::pow(scale, 2.)); // Figure out bbox dimension. float bbox_width = scale * sqrt(aspect_ratio); From 017bc662b7f311dccb0d1e15e5adad776ae5473e Mon Sep 17 00:00:00 2001 From: fzou1 Date: Tue, 2 Jan 2018 22:44:27 +0800 Subject: [PATCH 32/53] fix build issue of weight quantization + older MLSL version (<=2017.1.016) --- Makefile.dlcp | 5 ++++ cmake/Dependencies.cmake | 40 ++++++++++++++------------ include/caffe/multinode/mlsl.hpp | 14 +++++++-- include/caffe/multinode/multi_sync.hpp | 6 ++++ 4 files changed, 44 insertions(+), 21 deletions(-) diff --git a/Makefile.dlcp b/Makefile.dlcp index c0a180327..fc239b957 100644 --- a/Makefile.dlcp +++ b/Makefile.dlcp @@ -42,6 +42,7 @@ endif endif ifeq ($(USE_MLSL), 1) +ifneq ($(ENABLE_WEIGHT_GRAD_COMPRESSION), 0) ifeq ($(origin DLCPROOT), environment) dlcp: dlcproot_set else @@ -53,6 +54,10 @@ dlcp: endif endif else +dlcp: + @echo "disabling weight grad compression if ENABLE_WEIGHT_GRAD_COMPRESSION is set to 0" +endif +else dlcp: @echo "disabling weight grad compression if USE_MLSL is not 1" endif diff --git a/cmake/Dependencies.cmake b/cmake/Dependencies.cmake index c01daa1a3..732218865 100644 --- a/cmake/Dependencies.cmake +++ b/cmake/Dependencies.cmake @@ -136,28 +136,30 @@ endif() # ---| DLCP if(USE_MLSL) - if(DEFINED ENV{DLCPROOT}) - set(DLCPROOT_DIR $ENV{DLCPROOT}) - if(NOT ${DLCPROOT_DIR} STREQUAL "") - set(DLCPROOT_INCLUDE_DIR "${DLCPROOT_DIR}/include/") - set(DLCPROOT_LIB_DIR "${DLCPROOT_DIR}/lib/") - if(EXISTS ${DLCPROOT_INCLUDE_DIR}/dl_compression.h AND EXISTS ${DLCPROOT_LIB_DIR}/libdlcomp.so) - message(STATUS "Found DLCP: ${DLCPROOT_DIR}") + if (ENABLE_WEIGHT_GRAD_COMPRESSION OR NOT DEFINED ENABLE_WEIGHT_GRAD_COMPRESSION) + if(DEFINED ENV{DLCPROOT}) + set(DLCPROOT_DIR $ENV{DLCPROOT}) + if(NOT ${DLCPROOT_DIR} STREQUAL "") + set(DLCPROOT_INCLUDE_DIR "${DLCPROOT_DIR}/include/") + 
set(DLCPROOT_LIB_DIR "${DLCPROOT_DIR}/lib/") + if(EXISTS ${DLCPROOT_INCLUDE_DIR}/dl_compression.h AND EXISTS ${DLCPROOT_LIB_DIR}/libdlcomp.so) + message(STATUS "Found DLCP: ${DLCPROOT_DIR}") + set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DENABLE_WEIGHT_GRAD_COMPRESSION") + list(APPEND Caffe_LINKER_LIBS "${DLCPROOT_LIB_DIR}/libdlcomp.so") + include_directories(SYSTEM ${DLCP_INCLUDE_DIR}) + else() + message(STATUS "DLCP not found. DLCP_INCLUDE_DIR = ${DLCPROOT_INCLUDE_DIR} DLCP_LIB_DIR = ${DLCPROOT_LIB_DIR}") + message(WARNING "weight grad compression is disabled.") + endif() + endif() + else() + Download_DLCP() + if(DLCP_CXX) set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DENABLE_WEIGHT_GRAD_COMPRESSION") - list(APPEND Caffe_LINKER_LIBS "${DLCPROOT_LIB_DIR}/libdlcomp.so") - include_directories(SYSTEM ${DLCP_INCLUDE_DIR}) - else() - message(STATUS "DLCP not found. DLCP_INCLUDE_DIR = ${DLCPROOT_INCLUDE_DIR} DLCP_LIB_DIR = ${DLCPROOT_LIB_DIR}") - message(WARNING "weight grad compression is disabled.") + list(APPEND Caffe_LINKER_LIBS "${DLCP_LIBDIR}/libdlcomp.so") + include_directories(SYSTEM ${DLCP_INCLDIR}) endif() endif() - else() - Download_DLCP() - if(DLCP_CXX) - set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DENABLE_WEIGHT_GRAD_COMPRESSION") - list(APPEND Caffe_LINKER_LIBS "${DLCP_LIBDIR}/libdlcomp.so") - include_directories(SYSTEM ${DLCP_INCLDIR}) - endif() endif() endif() diff --git a/include/caffe/multinode/mlsl.hpp b/include/caffe/multinode/mlsl.hpp index 9f15a8acf..02360f8c0 100644 --- a/include/caffe/multinode/mlsl.hpp +++ b/include/caffe/multinode/mlsl.hpp @@ -398,9 +398,11 @@ namespace caffe { get_session().commit(); } +#ifdef ENABLE_WEIGHT_GRAD_COMPRESSION inline void set_quantization_param(MLSL::QuantParams *qparams) { MLSL::Environment::GetEnv().SetQuantizationParams(qparams); } +#endif namespace stats { inline void stop() { @@ -478,10 +480,18 @@ namespace caffe { } template void add_parameter_set(int kernelCount, int kernelSize, - bool distributedUpdate = false, 
MLSL::CompressionType compressType = MLSL::CompressionType::CT_NONE) + bool distributedUpdate = false +#ifdef ENABLE_WEIGHT_GRAD_COMPRESSION + , MLSL::CompressionType compressType = MLSL::CompressionType::CT_NONE +#endif + ) { opRegInfo_->AddParameterSet(kernelCount, kernelSize, detail::dtype(), - distributedUpdate, compressType); + distributedUpdate +#ifdef ENABLE_WEIGHT_GRAD_COMPRESSION + , compressType +#endif + ); } private: MLSL::OperationRegInfo *opRegInfo_{ nullptr }; diff --git a/include/caffe/multinode/multi_sync.hpp b/include/caffe/multinode/multi_sync.hpp index 61a79f5a2..969cb53ac 100644 --- a/include/caffe/multinode/multi_sync.hpp +++ b/include/caffe/multinode/multi_sync.hpp @@ -200,6 +200,12 @@ namespace caffe { << " ENABLED" #else << " DISABLED" +#endif + << ", WEIGHT GRADIENT COMPRESSION IS" +#ifdef ENABLE_WEIGHT_GRAD_COMPRESSION + << " ENABLED" +#else + << " DISABLED" #endif << ", SINGLE DB SPLITTING IS" #ifdef CAFFE_MLSL_SHUFFLE From 5e6b19904e702e90bfb7d6d3812d14fa3f0ab26c Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Wed, 3 Jan 2018 06:15:38 +0800 Subject: [PATCH 33/53] Add the unit test case for conv/sum/relu fusion. 
--- src/caffe/test/test_net.cpp | 110 ++++++++++++++++++++++++++++++++++++ 1 file changed, 110 insertions(+) diff --git a/src/caffe/test/test_net.cpp b/src/caffe/test/test_net.cpp index c62ed6850..53c4e2e1a 100644 --- a/src/caffe/test/test_net.cpp +++ b/src/caffe/test/test_net.cpp @@ -3463,6 +3463,116 @@ TEST_F(CompileNetTest, TestCompileNetBatchNormConvolution) { } #endif +#ifndef DISABLE_CONV_SUM_FUSION +TEST_F(CompileNetTest, TestCompileNetConvEltReluFusionMKLDNN) { + + const string& input_proto = + "name: 'TestNetwork' " + "layer { " + " name: 'data' " + " type: 'Data' " + " top: 'data' " + " top: 'label' " + "} " + "layer { " + " bottom: 'data' " + " name: 'conv1' " + " top: 'conv1' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " bottom: 'data' " + " name: 'conv2' " + " top: 'conv2' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " bottom: 'conv1' " + " name: 'conv3' " + " top: 'conv3' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " bottom: 'conv2' " + " bottom: 'conv3' " + " name: 'conv4' " + " top: 'relu' " + " type: 'Eltwise' " + "} " + + "layer { " + " bottom: 'relu' " + " top: 'relu' " + " name: 'relu' " + " type: 'ReLU' " + "}" + + "layer { " + " name: 'loss' " + " type: 'SoftmaxWithLoss' " + " bottom: 'relu' " + " bottom: 'label' " + "} "; + + const string& output_proto = + "name: 'TestNetwork' " + "layer { " + " name: 'data' " + " type: 'Data' " + " top: 'data' " + " top: 'label' " + "} " + + "layer { " + " bottom: 'data' " + " name: 'conv1' " + " top: 'conv1' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " bottom: 'data' " + " name: 'conv2' " + " top: 'conv2' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " bottom: 'conv1' " + " bottom: 'conv2' " + " name: 'conv3' 
" + " top: 'relu' " + " type: 'Convolution' " + " convolution_param { " + " engine: MKLDNN " + " } " + "} " + "layer { " + " name: 'loss' " + " type: 'SoftmaxWithLoss' " + " bottom: 'relu' " + " bottom: 'label' " + "} "; + + const string input_proto_test = "state: { phase: TEST } engine: 'MKLDNN'" + input_proto; + const string output_proto_test = "state: { phase: TEST } engine: 'MKLDNN'" + output_proto; + this->RunCompilerNetTest(input_proto_test, output_proto_test); +} +#endif + #ifdef MKLDNN_SUPPORTED // If BatchNorm of engine MKLDNN // produce blob consumed by From c15df526402e671274a3f0fad5b5b90d124631cd Mon Sep 17 00:00:00 2001 From: Shane Li Date: Thu, 28 Dec 2017 14:25:51 +0800 Subject: [PATCH 34/53] Add run_benchmark python script, support scaling test and provide config file for user to do flexible configure on benchmarking. Change-Id: I0eb7db07477f439899a4cec5c4be432123e4a6d7 --- .../alexnet/solver_dummydata.prototxt | 25 + .../alexnet/train_val_dummydata.prototxt | 394 ++ .../googlenet/solver_dummydata.prototxt | 25 + .../googlenet/train_val_dummydata.prototxt | 2427 ++++++++++ .../googlenet_v2/solver_dummydata.prototxt | 25 + .../googlenet_v2/train_val_dummydata.prototxt | 4034 +++++++++++++++++ .../resnet_50/solver.prototxt | 17 + .../resnet_50/solver_dummydata.prototxt | 25 + .../resnet_50/train_val.prototxt | 3322 ++++++++++++++ .../resnet_50/train_val_dummydata.prototxt | 3051 +++++++++++++ scripts/benchmark_config_template.json | 38 + scripts/run_benchmark.py | 369 ++ 12 files changed, 13752 insertions(+) create mode 100644 models/intel_optimized_models/alexnet/solver_dummydata.prototxt create mode 100644 models/intel_optimized_models/alexnet/train_val_dummydata.prototxt create mode 100644 models/intel_optimized_models/googlenet/solver_dummydata.prototxt create mode 100644 models/intel_optimized_models/googlenet/train_val_dummydata.prototxt create mode 100644 models/intel_optimized_models/googlenet_v2/solver_dummydata.prototxt create mode 100644 
models/intel_optimized_models/googlenet_v2/train_val_dummydata.prototxt create mode 100644 models/intel_optimized_models/resnet_50/solver.prototxt create mode 100644 models/intel_optimized_models/resnet_50/solver_dummydata.prototxt create mode 100644 models/intel_optimized_models/resnet_50/train_val.prototxt create mode 100644 models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt create mode 100644 scripts/benchmark_config_template.json create mode 100755 scripts/run_benchmark.py diff --git a/models/intel_optimized_models/alexnet/solver_dummydata.prototxt b/models/intel_optimized_models/alexnet/solver_dummydata.prototxt new file mode 100644 index 000000000..5c15e565e --- /dev/null +++ b/models/intel_optimized_models/alexnet/solver_dummydata.prototxt @@ -0,0 +1,25 @@ +#This is Intel(R) optimized (in terms of time to train) version of solver for model described in the [AlexNet](http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks) publication. +#Original solver.prototxt can be found in /models/bvlc_alexnet/ directory of this repository. +#Differences: +#- lr_policy is set to poly instead of step +#- base_lr is decreased to 0.007 +#- max_iter is decreased to 250000 +#- power is set to 0.6 +# +#Top-5 and Top-1 results achieved with this version of solver: +#Top-5: 80.4% +#Top-1: 57.4% +#Training was performed using server equipped with Intel(R) Xeon Phi(TM) CPU 7250 processor. 
+net: "models/intel_optimized_models/alexnet/train_val_dummydata.prototxt" +test_iter: 1000 +test_interval: 10000 +base_lr: 0.007 +lr_policy: "poly" +power: 0.6 +display: 1 +max_iter: 200 +momentum: 0.9 +weight_decay: 0.0005 +snapshot: 50000 +snapshot_prefix: "models/intel_optimized_models/alexnet/alexnet_train" +solver_mode: CPU diff --git a/models/intel_optimized_models/alexnet/train_val_dummydata.prototxt b/models/intel_optimized_models/alexnet/train_val_dummydata.prototxt new file mode 100644 index 000000000..fc47551c3 --- /dev/null +++ b/models/intel_optimized_models/alexnet/train_val_dummydata.prototxt @@ -0,0 +1,394 @@ +name: "AlexNet" +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TRAIN + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 256 dim: 3 dim: 224 dim: 224 } + shape: { dim: 256 dim: 1 dim: 1 dim: 1 } + } +} +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TEST + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 256 dim: 3 dim: 224 dim: 224 } + shape: { dim: 256 dim: 1 dim: 1 dim: 1 } + } +} + +layer { + name: "conv1" + type: "Convolution" + bottom: "data" + top: "conv1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + kernel_size: 11 + stride: 4 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "relu1" + type: "ReLU" + bottom: "conv1" + top: "conv1" +} +layer { + name: "norm1" + type: "LRN" + bottom: "conv1" + top: "norm1" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "pool1" + type: "Pooling" + bottom: "norm1" + top: "pool1" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "conv2" + type: "Convolution" + bottom: "pool1" + top: "conv2" + param { + 
lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 2 + kernel_size: 5 + group: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "relu2" + type: "ReLU" + bottom: "conv2" + top: "conv2" +} +layer { + name: "norm2" + type: "LRN" + bottom: "conv2" + top: "norm2" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "pool2" + type: "Pooling" + bottom: "norm2" + top: "pool2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "conv3" + type: "Convolution" + bottom: "pool2" + top: "conv3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + pad: 1 + kernel_size: 3 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "relu3" + type: "ReLU" + bottom: "conv3" + top: "conv3" +} +layer { + name: "conv4" + type: "Convolution" + bottom: "conv3" + top: "conv4" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + pad: 1 + kernel_size: 3 + group: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "relu4" + type: "ReLU" + bottom: "conv4" + top: "conv4" +} +layer { + name: "conv5" + type: "Convolution" + bottom: "conv4" + top: "conv5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + group: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "relu5" + type: "ReLU" + bottom: "conv5" + top: "conv5" +} +layer { + name: "pool5" + type: "Pooling" + bottom: "conv5" + top: "pool5" + pooling_param { + 
pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "fc6" + type: "InnerProduct" + bottom: "pool5" + top: "fc6" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 4096 + weight_filler { + type: "gaussian" + std: 0.005 + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "relu6" + type: "ReLU" + bottom: "fc6" + top: "fc6" +} +layer { + name: "drop6" + type: "Dropout" + bottom: "fc6" + top: "fc6" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + name: "fc7" + type: "InnerProduct" + bottom: "fc6" + top: "fc7" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 4096 + weight_filler { + type: "gaussian" + std: 0.005 + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "relu7" + type: "ReLU" + bottom: "fc7" + top: "fc7" +} +layer { + name: "drop7" + type: "Dropout" + bottom: "fc7" + top: "fc7" + dropout_param { + dropout_ratio: 0.5 + } +} +layer { + name: "fc8" + type: "InnerProduct" + bottom: "fc7" + top: "fc8" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss" + type: "SoftmaxWithLoss" + bottom: "fc8" + bottom: "label" + top: "loss" +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "loss3/top-1" + include { + phase: TEST + } +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "fc8" + bottom: "label" + top: "loss3/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/googlenet/solver_dummydata.prototxt b/models/intel_optimized_models/googlenet/solver_dummydata.prototxt new file mode 100644 index 000000000..02ce2018a --- /dev/null +++ 
b/models/intel_optimized_models/googlenet/solver_dummydata.prototxt @@ -0,0 +1,25 @@ +#This is Intel(R) optimized (in terms of time to train) version of solver for model described in the [AlexNet](http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks) publication. +#Original solver.prototxt can be found in /models/bvlc_alexnet/ directory of this repository. +#Differences: +#- lr_policy is set to poly instead of step +#- base_lr is decreased to 0.007 +#- max_iter is decreased to 250000 +#- power is set to 0.6 +# +#Top-5 and Top-1 results achieved with this version of solver: +#Top-5: 80.4% +#Top-1: 57.4% +#Training was performed using server equipped with Intel(R) Xeon Phi(TM) CPU 7250 processor. +net: "models/intel_optimized_models/googlenet/train_val_dummydata.prototxt" +test_iter: 1000 +test_interval: 10000 +base_lr: 0.007 +lr_policy: "poly" +power: 0.6 +display: 1 +max_iter: 200 +momentum: 0.9 +weight_decay: 0.0005 +snapshot: 50000 +snapshot_prefix: "models/intel_optimized_models/googlenet/googlenet_train" +solver_mode: CPU diff --git a/models/intel_optimized_models/googlenet/train_val_dummydata.prototxt b/models/intel_optimized_models/googlenet/train_val_dummydata.prototxt new file mode 100644 index 000000000..bf411dfe7 --- /dev/null +++ b/models/intel_optimized_models/googlenet/train_val_dummydata.prototxt @@ -0,0 +1,2427 @@ +name: "GoogleNet" +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TRAIN + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 64 dim: 3 dim: 224 dim: 224 } + shape: { dim: 64 dim: 1 dim: 1 dim: 1 } + } +} + +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TEST + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 32 dim: 3 dim: 224 dim: 224 } + shape: { dim: 32 dim: 1 dim: 1 dim: 1 } + } +} + +layer { + name: "conv1/7x7_s2" + 
type: "Convolution" + bottom: "data" + top: "conv1/7x7_s2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 3 + kernel_size: 7 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv1/relu_7x7" + type: "ReLU" + bottom: "conv1/7x7_s2" + top: "conv1/7x7_s2" +} +layer { + name: "pool1/3x3_s2" + type: "Pooling" + bottom: "conv1/7x7_s2" + top: "pool1/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "pool1/norm1" + type: "LRN" + bottom: "pool1/3x3_s2" + top: "pool1/norm1" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "conv2/3x3_reduce" + type: "Convolution" + bottom: "pool1/norm1" + top: "conv2/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv2/relu_3x3_reduce" + type: "ReLU" + bottom: "conv2/3x3_reduce" + top: "conv2/3x3_reduce" +} +layer { + name: "conv2/3x3" + type: "Convolution" + bottom: "conv2/3x3_reduce" + top: "conv2/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "conv2/relu_3x3" + type: "ReLU" + bottom: "conv2/3x3" + top: "conv2/3x3" +} +layer { + name: "conv2/norm2" + type: "LRN" + bottom: "conv2/3x3" + top: "conv2/norm2" + lrn_param { + local_size: 5 + alpha: 0.0001 + beta: 0.75 + } +} +layer { + name: "pool2/3x3_s2" + type: "Pooling" + bottom: "conv2/norm2" + top: "pool2/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_3a/1x1" + 
type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_1x1" + type: "ReLU" + bottom: "inception_3a/1x1" + top: "inception_3a/1x1" +} +layer { + name: "inception_3a/3x3_reduce" + type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_3a/3x3_reduce" + top: "inception_3a/3x3_reduce" +} +layer { + name: "inception_3a/3x3" + type: "Convolution" + bottom: "inception_3a/3x3_reduce" + top: "inception_3a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_3x3" + type: "ReLU" + bottom: "inception_3a/3x3" + top: "inception_3a/3x3" +} +layer { + name: "inception_3a/5x5_reduce" + type: "Convolution" + bottom: "pool2/3x3_s2" + top: "inception_3a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_3a/5x5_reduce" + top: "inception_3a/5x5_reduce" +} +layer { + name: "inception_3a/5x5" + type: "Convolution" + bottom: "inception_3a/5x5_reduce" 
+ top: "inception_3a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_5x5" + type: "ReLU" + bottom: "inception_3a/5x5" + top: "inception_3a/5x5" +} +layer { + name: "inception_3a/pool" + type: "Pooling" + bottom: "pool2/3x3_s2" + top: "inception_3a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_3a/pool_proj" + type: "Convolution" + bottom: "inception_3a/pool" + top: "inception_3a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3a/relu_pool_proj" + type: "ReLU" + bottom: "inception_3a/pool_proj" + top: "inception_3a/pool_proj" +} +layer { + name: "inception_3a/output" + type: "Concat" + bottom: "inception_3a/1x1" + bottom: "inception_3a/3x3" + bottom: "inception_3a/5x5" + bottom: "inception_3a/pool_proj" + top: "inception_3a/output" +} +layer { + name: "inception_3b/1x1" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_1x1" + type: "ReLU" + bottom: "inception_3b/1x1" + top: "inception_3b/1x1" +} +layer { + name: "inception_3b/3x3_reduce" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + 
num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_3b/3x3_reduce" + top: "inception_3b/3x3_reduce" +} +layer { + name: "inception_3b/3x3" + type: "Convolution" + bottom: "inception_3b/3x3_reduce" + top: "inception_3b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_3x3" + type: "ReLU" + bottom: "inception_3b/3x3" + top: "inception_3b/3x3" +} +layer { + name: "inception_3b/5x5_reduce" + type: "Convolution" + bottom: "inception_3a/output" + top: "inception_3b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_3b/5x5_reduce" + top: "inception_3b/5x5_reduce" +} +layer { + name: "inception_3b/5x5" + type: "Convolution" + bottom: "inception_3b/5x5_reduce" + top: "inception_3b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_5x5" + type: "ReLU" + bottom: "inception_3b/5x5" + top: "inception_3b/5x5" +} +layer { + name: "inception_3b/pool" + type: "Pooling" + bottom: "inception_3a/output" + top: "inception_3b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_3b/pool_proj" + type: "Convolution" + 
bottom: "inception_3b/pool" + top: "inception_3b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_3b/relu_pool_proj" + type: "ReLU" + bottom: "inception_3b/pool_proj" + top: "inception_3b/pool_proj" +} +layer { + name: "inception_3b/output" + type: "Concat" + bottom: "inception_3b/1x1" + bottom: "inception_3b/3x3" + bottom: "inception_3b/5x5" + bottom: "inception_3b/pool_proj" + top: "inception_3b/output" +} +layer { + name: "pool3/3x3_s2" + type: "Pooling" + bottom: "inception_3b/output" + top: "pool3/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_4a/1x1" + type: "Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_1x1" + type: "ReLU" + bottom: "inception_4a/1x1" + top: "inception_4a/1x1" +} +layer { + name: "inception_4a/3x3_reduce" + type: "Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 96 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4a/3x3_reduce" + top: "inception_4a/3x3_reduce" +} +layer { + name: "inception_4a/3x3" + type: "Convolution" + bottom: "inception_4a/3x3_reduce" + top: "inception_4a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param 
{ + num_output: 208 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_3x3" + type: "ReLU" + bottom: "inception_4a/3x3" + top: "inception_4a/3x3" +} +layer { + name: "inception_4a/5x5_reduce" + type: "Convolution" + bottom: "pool3/3x3_s2" + top: "inception_4a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4a/5x5_reduce" + top: "inception_4a/5x5_reduce" +} +layer { + name: "inception_4a/5x5" + type: "Convolution" + bottom: "inception_4a/5x5_reduce" + top: "inception_4a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 48 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_5x5" + type: "ReLU" + bottom: "inception_4a/5x5" + top: "inception_4a/5x5" +} +layer { + name: "inception_4a/pool" + type: "Pooling" + bottom: "pool3/3x3_s2" + top: "inception_4a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4a/pool_proj" + type: "Convolution" + bottom: "inception_4a/pool" + top: "inception_4a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4a/relu_pool_proj" + type: "ReLU" + bottom: "inception_4a/pool_proj" + top: "inception_4a/pool_proj" +} +layer { + name: "inception_4a/output" + type: "Concat" + bottom: 
"inception_4a/1x1" + bottom: "inception_4a/3x3" + bottom: "inception_4a/5x5" + bottom: "inception_4a/pool_proj" + top: "inception_4a/output" +} +layer { + name: "loss1/ave_pool" + type: "Pooling" + bottom: "inception_4a/output" + top: "loss1/ave_pool" + pooling_param { + pool: AVE + kernel_size: 5 + stride: 3 + } +} +layer { + name: "loss1/conv" + type: "Convolution" + bottom: "loss1/ave_pool" + top: "loss1/conv" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss1/relu_conv" + type: "ReLU" + bottom: "loss1/conv" + top: "loss1/conv" +} +layer { + name: "loss1/fc" + type: "InnerProduct" + bottom: "loss1/conv" + top: "loss1/fc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss1/relu_fc" + type: "ReLU" + bottom: "loss1/fc" + top: "loss1/fc" +} +layer { + name: "loss1/drop_fc" + type: "Dropout" + bottom: "loss1/fc" + top: "loss1/fc" + dropout_param { + dropout_ratio: 0.7 + } +} +layer { + name: "loss1/classifier" + type: "InnerProduct" + bottom: "loss1/fc" + top: "loss1/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss1/loss" + type: "SoftmaxWithLoss" + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/loss1" + loss_weight: 0.3 +} +layer { + name: "loss1/top-1" + type: "Accuracy" + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/top-1" + include { + phase: TEST + } +} +layer { + name: "loss1/top-5" + type: "Accuracy" + bottom: 
"loss1/classifier" + bottom: "label" + top: "loss1/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} +layer { + name: "inception_4b/1x1" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_1x1" + type: "ReLU" + bottom: "inception_4b/1x1" + top: "inception_4b/1x1" +} +layer { + name: "inception_4b/3x3_reduce" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 112 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4b/3x3_reduce" + top: "inception_4b/3x3_reduce" +} +layer { + name: "inception_4b/3x3" + type: "Convolution" + bottom: "inception_4b/3x3_reduce" + top: "inception_4b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 224 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_3x3" + type: "ReLU" + bottom: "inception_4b/3x3" + top: "inception_4b/3x3" +} +layer { + name: "inception_4b/5x5_reduce" + type: "Convolution" + bottom: "inception_4a/output" + top: "inception_4b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: 
"inception_4b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4b/5x5_reduce" + top: "inception_4b/5x5_reduce" +} +layer { + name: "inception_4b/5x5" + type: "Convolution" + bottom: "inception_4b/5x5_reduce" + top: "inception_4b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_5x5" + type: "ReLU" + bottom: "inception_4b/5x5" + top: "inception_4b/5x5" +} +layer { + name: "inception_4b/pool" + type: "Pooling" + bottom: "inception_4a/output" + top: "inception_4b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4b/pool_proj" + type: "Convolution" + bottom: "inception_4b/pool" + top: "inception_4b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4b/relu_pool_proj" + type: "ReLU" + bottom: "inception_4b/pool_proj" + top: "inception_4b/pool_proj" +} +layer { + name: "inception_4b/output" + type: "Concat" + bottom: "inception_4b/1x1" + bottom: "inception_4b/3x3" + bottom: "inception_4b/5x5" + bottom: "inception_4b/pool_proj" + top: "inception_4b/output" +} +layer { + name: "inception_4c/1x1" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_1x1" + type: "ReLU" + bottom: "inception_4c/1x1" + top: "inception_4c/1x1" +} +layer { + name: 
"inception_4c/3x3_reduce" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4c/3x3_reduce" + top: "inception_4c/3x3_reduce" +} +layer { + name: "inception_4c/3x3" + type: "Convolution" + bottom: "inception_4c/3x3_reduce" + top: "inception_4c/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_3x3" + type: "ReLU" + bottom: "inception_4c/3x3" + top: "inception_4c/3x3" +} +layer { + name: "inception_4c/5x5_reduce" + type: "Convolution" + bottom: "inception_4b/output" + top: "inception_4c/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4c/5x5_reduce" + top: "inception_4c/5x5_reduce" +} +layer { + name: "inception_4c/5x5" + type: "Convolution" + bottom: "inception_4c/5x5_reduce" + top: "inception_4c/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_5x5" + type: "ReLU" + bottom: "inception_4c/5x5" + top: "inception_4c/5x5" +} +layer { + name: "inception_4c/pool" + 
type: "Pooling" + bottom: "inception_4b/output" + top: "inception_4c/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4c/pool_proj" + type: "Convolution" + bottom: "inception_4c/pool" + top: "inception_4c/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4c/relu_pool_proj" + type: "ReLU" + bottom: "inception_4c/pool_proj" + top: "inception_4c/pool_proj" +} +layer { + name: "inception_4c/output" + type: "Concat" + bottom: "inception_4c/1x1" + bottom: "inception_4c/3x3" + bottom: "inception_4c/5x5" + bottom: "inception_4c/pool_proj" + top: "inception_4c/output" +} +layer { + name: "inception_4d/1x1" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 112 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_1x1" + type: "ReLU" + bottom: "inception_4d/1x1" + top: "inception_4d/1x1" +} +layer { + name: "inception_4d/3x3_reduce" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 144 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4d/3x3_reduce" + top: "inception_4d/3x3_reduce" +} +layer { + name: "inception_4d/3x3" + type: "Convolution" + bottom: "inception_4d/3x3_reduce" + top: "inception_4d/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + 
param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 288 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_3x3" + type: "ReLU" + bottom: "inception_4d/3x3" + top: "inception_4d/3x3" +} +layer { + name: "inception_4d/5x5_reduce" + type: "Convolution" + bottom: "inception_4c/output" + top: "inception_4d/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4d/5x5_reduce" + top: "inception_4d/5x5_reduce" +} +layer { + name: "inception_4d/5x5" + type: "Convolution" + bottom: "inception_4d/5x5_reduce" + top: "inception_4d/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_5x5" + type: "ReLU" + bottom: "inception_4d/5x5" + top: "inception_4d/5x5" +} +layer { + name: "inception_4d/pool" + type: "Pooling" + bottom: "inception_4c/output" + top: "inception_4d/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4d/pool_proj" + type: "Convolution" + bottom: "inception_4d/pool" + top: "inception_4d/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4d/relu_pool_proj" + type: "ReLU" + bottom: "inception_4d/pool_proj" + top: "inception_4d/pool_proj" +} 
+layer { + name: "inception_4d/output" + type: "Concat" + bottom: "inception_4d/1x1" + bottom: "inception_4d/3x3" + bottom: "inception_4d/5x5" + bottom: "inception_4d/pool_proj" + top: "inception_4d/output" +} +layer { + name: "loss2/ave_pool" + type: "Pooling" + bottom: "inception_4d/output" + top: "loss2/ave_pool" + pooling_param { + pool: AVE + kernel_size: 5 + stride: 3 + } +} +layer { + name: "loss2/conv" + type: "Convolution" + bottom: "loss2/ave_pool" + top: "loss2/conv" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss2/relu_conv" + type: "ReLU" + bottom: "loss2/conv" + top: "loss2/conv" +} +layer { + name: "loss2/fc" + type: "InnerProduct" + bottom: "loss2/conv" + top: "loss2/fc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "loss2/relu_fc" + type: "ReLU" + bottom: "loss2/fc" + top: "loss2/fc" +} +layer { + name: "loss2/drop_fc" + type: "Dropout" + bottom: "loss2/fc" + top: "loss2/fc" + dropout_param { + dropout_ratio: 0.7 + } +} +layer { + name: "loss2/classifier" + type: "InnerProduct" + bottom: "loss2/fc" + top: "loss2/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss2/loss" + type: "SoftmaxWithLoss" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/loss1" + loss_weight: 0.3 +} +layer { + name: "loss2/top-1" + type: "Accuracy" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/top-1" + include { + phase: TEST + } +} +layer 
{ + name: "loss2/top-5" + type: "Accuracy" + bottom: "loss2/classifier" + bottom: "label" + top: "loss2/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} +layer { + name: "inception_4e/1x1" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_1x1" + type: "ReLU" + bottom: "inception_4e/1x1" + top: "inception_4e/1x1" +} +layer { + name: "inception_4e/3x3_reduce" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_4e/3x3_reduce" + top: "inception_4e/3x3_reduce" +} +layer { + name: "inception_4e/3x3" + type: "Convolution" + bottom: "inception_4e/3x3_reduce" + top: "inception_4e/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 320 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_3x3" + type: "ReLU" + bottom: "inception_4e/3x3" + top: "inception_4e/3x3" +} +layer { + name: "inception_4e/5x5_reduce" + type: "Convolution" + bottom: "inception_4d/output" + top: "inception_4e/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + 
} + } +} +layer { + name: "inception_4e/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_4e/5x5_reduce" + top: "inception_4e/5x5_reduce" +} +layer { + name: "inception_4e/5x5" + type: "Convolution" + bottom: "inception_4e/5x5_reduce" + top: "inception_4e/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_5x5" + type: "ReLU" + bottom: "inception_4e/5x5" + top: "inception_4e/5x5" +} +layer { + name: "inception_4e/pool" + type: "Pooling" + bottom: "inception_4d/output" + top: "inception_4e/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_4e/pool_proj" + type: "Convolution" + bottom: "inception_4e/pool" + top: "inception_4e/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_4e/relu_pool_proj" + type: "ReLU" + bottom: "inception_4e/pool_proj" + top: "inception_4e/pool_proj" +} +layer { + name: "inception_4e/output" + type: "Concat" + bottom: "inception_4e/1x1" + bottom: "inception_4e/3x3" + bottom: "inception_4e/5x5" + bottom: "inception_4e/pool_proj" + top: "inception_4e/output" +} +layer { + name: "pool4/3x3_s2" + type: "Pooling" + bottom: "inception_4e/output" + top: "pool4/3x3_s2" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "inception_5a/1x1" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + kernel_size: 1 + weight_filler { + type: "xavier" + } + 
bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_1x1" + type: "ReLU" + bottom: "inception_5a/1x1" + top: "inception_5a/1x1" +} +layer { + name: "inception_5a/3x3_reduce" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 160 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_5a/3x3_reduce" + top: "inception_5a/3x3_reduce" +} +layer { + name: "inception_5a/3x3" + type: "Convolution" + bottom: "inception_5a/3x3_reduce" + top: "inception_5a/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 320 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_3x3" + type: "ReLU" + bottom: "inception_5a/3x3" + top: "inception_5a/3x3" +} +layer { + name: "inception_5a/5x5_reduce" + type: "Convolution" + bottom: "pool4/3x3_s2" + top: "inception_5a/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 32 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_5a/5x5_reduce" + top: "inception_5a/5x5_reduce" +} +layer { + name: "inception_5a/5x5" + type: "Convolution" + bottom: "inception_5a/5x5_reduce" + top: "inception_5a/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + 
value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_5x5" + type: "ReLU" + bottom: "inception_5a/5x5" + top: "inception_5a/5x5" +} +layer { + name: "inception_5a/pool" + type: "Pooling" + bottom: "pool4/3x3_s2" + top: "inception_5a/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_5a/pool_proj" + type: "Convolution" + bottom: "inception_5a/pool" + top: "inception_5a/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5a/relu_pool_proj" + type: "ReLU" + bottom: "inception_5a/pool_proj" + top: "inception_5a/pool_proj" +} +layer { + name: "inception_5a/output" + type: "Concat" + bottom: "inception_5a/1x1" + bottom: "inception_5a/3x3" + bottom: "inception_5a/5x5" + bottom: "inception_5a/pool_proj" + top: "inception_5a/output" +} +layer { + name: "inception_5b/1x1" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/1x1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_1x1" + type: "ReLU" + bottom: "inception_5b/1x1" + top: "inception_5b/1x1" +} +layer { + name: "inception_5b/3x3_reduce" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/3x3_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 192 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_3x3_reduce" + type: "ReLU" + bottom: "inception_5b/3x3_reduce" + top: 
"inception_5b/3x3_reduce" +} +layer { + name: "inception_5b/3x3" + type: "Convolution" + bottom: "inception_5b/3x3_reduce" + top: "inception_5b/3x3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 384 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_3x3" + type: "ReLU" + bottom: "inception_5b/3x3" + top: "inception_5b/3x3" +} +layer { + name: "inception_5b/5x5_reduce" + type: "Convolution" + bottom: "inception_5a/output" + top: "inception_5b/5x5_reduce" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 48 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_5x5_reduce" + type: "ReLU" + bottom: "inception_5b/5x5_reduce" + top: "inception_5b/5x5_reduce" +} +layer { + name: "inception_5b/5x5" + type: "Convolution" + bottom: "inception_5b/5x5_reduce" + top: "inception_5b/5x5" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 2 + kernel_size: 5 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_5x5" + type: "ReLU" + bottom: "inception_5b/5x5" + top: "inception_5b/5x5" +} +layer { + name: "inception_5b/pool" + type: "Pooling" + bottom: "inception_5a/output" + top: "inception_5b/pool" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + name: "inception_5b/pool_proj" + type: "Convolution" + bottom: "inception_5b/pool" + top: "inception_5b/pool_proj" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + kernel_size: 1 + weight_filler { + type: "xavier" + } 
+ bias_filler { + type: "constant" + value: 0.1 + } + } +} +layer { + name: "inception_5b/relu_pool_proj" + type: "ReLU" + bottom: "inception_5b/pool_proj" + top: "inception_5b/pool_proj" +} +layer { + name: "inception_5b/output" + type: "Concat" + bottom: "inception_5b/1x1" + bottom: "inception_5b/3x3" + bottom: "inception_5b/5x5" + bottom: "inception_5b/pool_proj" + top: "inception_5b/output" +} +layer { + name: "pool5/7x7_s1" + type: "Pooling" + bottom: "inception_5b/output" + top: "pool5/7x7_s1" + pooling_param { + pool: AVE + kernel_size: 7 + stride: 1 + } +} +layer { + name: "pool5/drop_7x7_s1" + type: "Dropout" + bottom: "pool5/7x7_s1" + top: "pool5/7x7_s1" + dropout_param { + dropout_ratio: 0.4 + } +} +layer { + name: "loss3/classifier" + type: "InnerProduct" + bottom: "pool5/7x7_s1" + top: "loss3/classifier" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "loss3/loss3" + type: "SoftmaxWithLoss" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/loss3" + loss_weight: 1 +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/top-1" + include { + phase: TEST + } +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/googlenet_v2/solver_dummydata.prototxt b/models/intel_optimized_models/googlenet_v2/solver_dummydata.prototxt new file mode 100644 index 000000000..9162b472c --- /dev/null +++ b/models/intel_optimized_models/googlenet_v2/solver_dummydata.prototxt @@ -0,0 +1,25 @@ +#This is Intel(R) optimized (in terms of time to train) version of solver for model described in the 
[Batch-Normalized GoogLeNet (Inception-v2)](https://arxiv.org/abs/1502.03167) publication. +#Original solver.prototxt can be found in /models/bvlc_googlenet/ directory of this repository. +#Differences: +#- lr_policy is set to poly instead of step +#- base_lr is decreased to 0.007 +#- max_iter is decreased to 5000 +#- power is set to 0.6 +# +#Top-5 and Top-1 results achieved with this version of solver: +#Top-5: 80.4% +#Top-1: 57.4% +#Training was performed using server equipped with Intel(R) Xeon Phi(TM) CPU 7250 processor. +net: "models/intel_optimized_models/googlenet_v2/train_val_dummydata.prototxt" +test_iter: 1000 +test_interval: 10000 +base_lr: 0.007 +lr_policy: "poly" +power: 0.6 +display: 1 +max_iter: 5000 +momentum: 0.9 +weight_decay: 0.0005 +snapshot: 50000 +snapshot_prefix: "models/intel_optimized_models/googlenet_v2/googlenet_train" +solver_mode: CPU diff --git a/models/intel_optimized_models/googlenet_v2/train_val_dummydata.prototxt b/models/intel_optimized_models/googlenet_v2/train_val_dummydata.prototxt new file mode 100644 index 000000000..2908c3841 --- /dev/null +++ b/models/intel_optimized_models/googlenet_v2/train_val_dummydata.prototxt @@ -0,0 +1,4034 @@ +# Inception Network (GoogLeNet Batch Normalization Network) +name: "InceptionNetwork" +### Training Set +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TRAIN + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 96 dim: 3 dim: 224 dim: 224 } + shape: { dim: 96 dim: 1 dim: 1 dim: 1 } + } +} + +### Validation Set +layer { + name: "data" + type: "DummyData" + top: "data" + top: "label" + include { + phase: TEST + } + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape: { dim: 32 dim: 3 dim: 224 dim: 224 } + shape: { dim: 32 dim: 1 dim: 1 dim: 1 } + } +} + +layer { + bottom: "data" + top: "conv1/7x7_s2" + name: "conv1/7x7_s2" + type: "Convolution" + param 
{ + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 3 + kernel_size: 7 + stride: 2 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "conv1/7x7_s2" + name: "conv1/7x7_s2/bn" + top: "conv1/7x7_s2/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "conv1/7x7_s2/bn" + top: "conv1/7x7_s2/bn/sc" + name: "conv1/7x7_s2/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "conv1/7x7_s2/bn/sc" + top: "conv1/7x7_s2/bn/sc" + name: "conv1/7x7_s2/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv1/7x7_s2/bn/sc" + top: "pool1/3x3_s2" + name: "pool1/3x3_s2" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + bottom: "pool1/3x3_s2" + top: "conv2/3x3_reduce" + name: "conv2/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "conv2/3x3_reduce" + name: "conv2/3x3_reduce/bn" + top: "conv2/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "conv2/3x3_reduce/bn" + top: "conv2/3x3_reduce/bn/sc" + name: "conv2/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "conv2/3x3_reduce/bn/sc" + top: "conv2/3x3_reduce/bn/sc" + name: "conv2/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2/3x3_reduce/bn/sc" + top: "conv2/3x3" + name: "conv2/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "conv2/3x3" + name: "conv2/3x3/bn" + top: "conv2/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "conv2/3x3/bn" + top: 
"conv2/3x3/bn/sc" + name: "conv2/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "conv2/3x3/bn/sc" + top: "conv2/3x3/bn/sc" + name: "conv2/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "conv2/3x3/bn/sc" + top: "pool2/3x3_s2" + name: "pool2/3x3_s2" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + bottom: "pool2/3x3_s2" + top: "inception_3a/1x1" + name: "inception_3a/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/1x1" + name: "inception_3a/1x1/bn" + top: "inception_3a/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/1x1/bn" + top: "inception_3a/1x1/bn/sc" + name: "inception_3a/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/1x1/bn/sc" + top: "inception_3a/1x1/bn/sc" + name: "inception_3a/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "pool2/3x3_s2" + top: "inception_3a/3x3_reduce" + name: "inception_3a/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/3x3_reduce" + name: "inception_3a/3x3_reduce/bn" + top: "inception_3a/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/3x3_reduce/bn" + top: "inception_3a/3x3_reduce/bn/sc" + name: "inception_3a/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/3x3_reduce/bn/sc" + top: "inception_3a/3x3_reduce/bn/sc" + name: "inception_3a/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} 
+layer { + bottom: "inception_3a/3x3_reduce/bn/sc" + top: "inception_3a/3x3" + name: "inception_3a/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/3x3" + name: "inception_3a/3x3/bn" + top: "inception_3a/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/3x3/bn" + top: "inception_3a/3x3/bn/sc" + name: "inception_3a/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/3x3/bn/sc" + top: "inception_3a/3x3/bn/sc" + name: "inception_3a/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "pool2/3x3_s2" + top: "inception_3a/double3x3_reduce" + name: "inception_3a/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/double3x3_reduce" + name: "inception_3a/double3x3_reduce/bn" + top: "inception_3a/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/double3x3_reduce/bn" + top: "inception_3a/double3x3_reduce/bn/sc" + name: "inception_3a/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/double3x3_reduce/bn/sc" + top: "inception_3a/double3x3_reduce/bn/sc" + name: "inception_3a/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/double3x3_reduce/bn/sc" + top: "inception_3a/double3x3a" + name: "inception_3a/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: 
false + } +} +layer { + bottom: "inception_3a/double3x3a" + name: "inception_3a/double3x3a/bn" + top: "inception_3a/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/double3x3a/bn" + top: "inception_3a/double3x3a/bn/sc" + name: "inception_3a/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/double3x3a/bn/sc" + top: "inception_3a/double3x3a/bn/sc" + name: "inception_3a/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/double3x3a/bn/sc" + top: "inception_3a/double3x3b" + name: "inception_3a/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/double3x3b" + name: "inception_3a/double3x3b/bn" + top: "inception_3a/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/double3x3b/bn" + top: "inception_3a/double3x3b/bn/sc" + name: "inception_3a/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/double3x3b/bn/sc" + top: "inception_3a/double3x3b/bn/sc" + name: "inception_3a/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "pool2/3x3_s2" + top: "inception_3a/pool" + name: "inception_3a/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_3a/pool" + top: "inception_3a/pool_proj" + name: "inception_3a/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 32 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3a/pool_proj" + name: "inception_3a/pool_proj/bn" + top: 
"inception_3a/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3a/pool_proj/bn" + top: "inception_3a/pool_proj/bn/sc" + name: "inception_3a/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3a/pool_proj/bn/sc" + top: "inception_3a/pool_proj/bn/sc" + name: "inception_3a/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/1x1/bn/sc" + bottom: "inception_3a/3x3/bn/sc" + bottom: "inception_3a/double3x3b/bn/sc" + bottom: "inception_3a/pool_proj/bn/sc" + top: "inception_3a/output" + name: "inception_3a/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_3a/output" + top: "inception_3b/1x1" + name: "inception_3b/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/1x1" + name: "inception_3b/1x1/bn" + top: "inception_3b/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/1x1/bn" + top: "inception_3b/1x1/bn/sc" + name: "inception_3b/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/1x1/bn/sc" + top: "inception_3b/1x1/bn/sc" + name: "inception_3b/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/output" + top: "inception_3b/3x3_reduce" + name: "inception_3b/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/3x3_reduce" + name: "inception_3b/3x3_reduce/bn" + top: "inception_3b/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/3x3_reduce/bn" + top: 
"inception_3b/3x3_reduce/bn/sc" + name: "inception_3b/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/3x3_reduce/bn/sc" + top: "inception_3b/3x3_reduce/bn/sc" + name: "inception_3b/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3b/3x3_reduce/bn/sc" + top: "inception_3b/3x3" + name: "inception_3b/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/3x3" + name: "inception_3b/3x3/bn" + top: "inception_3b/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/3x3/bn" + top: "inception_3b/3x3/bn/sc" + name: "inception_3b/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/3x3/bn/sc" + top: "inception_3b/3x3/bn/sc" + name: "inception_3b/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/output" + top: "inception_3b/double3x3_reduce" + name: "inception_3b/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/double3x3_reduce" + name: "inception_3b/double3x3_reduce/bn" + top: "inception_3b/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/double3x3_reduce/bn" + top: "inception_3b/double3x3_reduce/bn/sc" + name: "inception_3b/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/double3x3_reduce/bn/sc" + top: "inception_3b/double3x3_reduce/bn/sc" + name: "inception_3b/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + 
bottom: "inception_3b/double3x3_reduce/bn/sc" + top: "inception_3b/double3x3a" + name: "inception_3b/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/double3x3a" + name: "inception_3b/double3x3a/bn" + top: "inception_3b/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/double3x3a/bn" + top: "inception_3b/double3x3a/bn/sc" + name: "inception_3b/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/double3x3a/bn/sc" + top: "inception_3b/double3x3a/bn/sc" + name: "inception_3b/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3b/double3x3a/bn/sc" + top: "inception_3b/double3x3b" + name: "inception_3b/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/double3x3b" + name: "inception_3b/double3x3b/bn" + top: "inception_3b/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/double3x3b/bn" + top: "inception_3b/double3x3b/bn/sc" + name: "inception_3b/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/double3x3b/bn/sc" + top: "inception_3b/double3x3b/bn/sc" + name: "inception_3b/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3a/output" + top: "inception_3b/pool" + name: "inception_3b/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_3b/pool" + top: "inception_3b/pool_proj" + name: "inception_3b/pool_proj" + 
type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3b/pool_proj" + name: "inception_3b/pool_proj/bn" + top: "inception_3b/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3b/pool_proj/bn" + top: "inception_3b/pool_proj/bn/sc" + name: "inception_3b/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3b/pool_proj/bn/sc" + top: "inception_3b/pool_proj/bn/sc" + name: "inception_3b/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3b/1x1/bn/sc" + bottom: "inception_3b/3x3/bn/sc" + bottom: "inception_3b/double3x3b/bn/sc" + bottom: "inception_3b/pool_proj/bn/sc" + top: "inception_3b/output" + name: "inception_3b/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_3b/output" + top: "inception_3c/3x3_reduce" + name: "inception_3c/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3c/3x3_reduce" + name: "inception_3c/3x3_reduce/bn" + top: "inception_3c/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3c/3x3_reduce/bn" + top: "inception_3c/3x3_reduce/bn/sc" + name: "inception_3c/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3c/3x3_reduce/bn/sc" + top: "inception_3c/3x3_reduce/bn/sc" + name: "inception_3c/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/3x3_reduce/bn/sc" + top: "inception_3c/3x3" + name: "inception_3c/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + 
} + convolution_param { + + num_output: 160 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3c/3x3" + name: "inception_3c/3x3/bn" + top: "inception_3c/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3c/3x3/bn" + top: "inception_3c/3x3/bn/sc" + name: "inception_3c/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3c/3x3/bn/sc" + top: "inception_3c/3x3/bn/sc" + name: "inception_3c/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3b/output" + top: "inception_3c/double3x3_reduce" + name: "inception_3c/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3c/double3x3_reduce" + name: "inception_3c/double3x3_reduce/bn" + top: "inception_3c/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3c/double3x3_reduce/bn" + top: "inception_3c/double3x3_reduce/bn/sc" + name: "inception_3c/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3c/double3x3_reduce/bn/sc" + top: "inception_3c/double3x3_reduce/bn/sc" + name: "inception_3c/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/double3x3_reduce/bn/sc" + top: "inception_3c/double3x3a" + name: "inception_3c/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3c/double3x3a" + name: "inception_3c/double3x3a/bn" + top: "inception_3c/double3x3a/bn" + type: "BatchNorm" + 
batch_norm_param { + + } +} +layer { + bottom: "inception_3c/double3x3a/bn" + top: "inception_3c/double3x3a/bn/sc" + name: "inception_3c/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3c/double3x3a/bn/sc" + top: "inception_3c/double3x3a/bn/sc" + name: "inception_3c/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/double3x3a/bn/sc" + top: "inception_3c/double3x3b" + name: "inception_3c/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_3c/double3x3b" + name: "inception_3c/double3x3b/bn" + top: "inception_3c/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_3c/double3x3b/bn" + top: "inception_3c/double3x3b/bn/sc" + name: "inception_3c/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_3c/double3x3b/bn/sc" + top: "inception_3c/double3x3b/bn/sc" + name: "inception_3c/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3b/output" + top: "inception_3c/pool" + name: "inception_3c/pool" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + bottom: "inception_3c/3x3/bn/sc" + bottom: "inception_3c/double3x3b/bn/sc" + bottom: "inception_3c/pool" + top: "inception_3c/output" + name: "inception_3c/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_3c/output" + top: "pool3/5x5_s3" + name: "pool3/5x5_s3" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 5 + stride: 3 + } +} +layer { + bottom: "pool3/5x5_s3" + top: "loss1/conv" + name: "loss1/conv" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 
0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "loss1/conv" + name: "loss1/conv/bn" + top: "loss1/conv/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "loss1/conv/bn" + top: "loss1/conv/bn/sc" + name: "loss1/conv/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "loss1/conv/bn/sc" + top: "loss1/conv/bn/sc" + name: "loss1/conv/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "loss1/conv/bn/sc" + top: "loss1/fc" + name: "loss1/fc" + type: "InnerProduct" + param { + lr_mult: 1 + decay_mult: 1 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "loss1/fc" + name: "loss1/fc/bn" + top: "loss1/fc/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "loss1/fc/bn" + top: "loss1/fc/bn/sc" + name: "loss1/fc/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "loss1/fc/bn/sc" + top: "loss1/fc/bn/sc" + name: "loss1/fc/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "loss1/fc/bn/sc" + top: "loss1/classifier" + name: "loss1/classifier" + type: "InnerProduct" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + bottom: "loss1/classifier" + bottom: "label" + top: "loss1/loss" + name: "loss1/loss" + type: "SoftmaxWithLoss" + loss_weight: 0.3 +} +layer { + bottom: "loss1/classifier" + top: "loss1/prob" + name: "loss1/prob" + type: "Softmax" + include { + phase: TEST + } +} +layer { + bottom: "loss1/prob" + bottom: "label" + top: "loss1/top-1" + name: "loss1/top-1" + type: "Accuracy" + include { + phase: TEST + } +} +layer { + bottom: "loss1/prob" + bottom: "label" + top: "loss1/top-5" + name: "loss1/top-5" + 
type: "Accuracy" + accuracy_param { + top_k: 5 + } + include { + phase: TEST + } +} +layer { + bottom: "inception_3c/output" + top: "inception_4a/1x1" + name: "inception_4a/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 224 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/1x1" + name: "inception_4a/1x1/bn" + top: "inception_4a/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/1x1/bn" + top: "inception_4a/1x1/bn/sc" + name: "inception_4a/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/1x1/bn/sc" + top: "inception_4a/1x1/bn/sc" + name: "inception_4a/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/output" + top: "inception_4a/3x3_reduce" + name: "inception_4a/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 64 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/3x3_reduce" + name: "inception_4a/3x3_reduce/bn" + top: "inception_4a/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/3x3_reduce/bn" + top: "inception_4a/3x3_reduce/bn/sc" + name: "inception_4a/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/3x3_reduce/bn/sc" + top: "inception_4a/3x3_reduce/bn/sc" + name: "inception_4a/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/3x3_reduce/bn/sc" + top: "inception_4a/3x3" + name: "inception_4a/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false 
+ } +} +layer { + bottom: "inception_4a/3x3" + name: "inception_4a/3x3/bn" + top: "inception_4a/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/3x3/bn" + top: "inception_4a/3x3/bn/sc" + name: "inception_4a/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/3x3/bn/sc" + top: "inception_4a/3x3/bn/sc" + name: "inception_4a/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/output" + top: "inception_4a/double3x3_reduce" + name: "inception_4a/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/double3x3_reduce" + name: "inception_4a/double3x3_reduce/bn" + top: "inception_4a/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/double3x3_reduce/bn" + top: "inception_4a/double3x3_reduce/bn/sc" + name: "inception_4a/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/double3x3_reduce/bn/sc" + top: "inception_4a/double3x3_reduce/bn/sc" + name: "inception_4a/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/double3x3_reduce/bn/sc" + top: "inception_4a/double3x3a" + name: "inception_4a/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/double3x3a" + name: "inception_4a/double3x3a/bn" + top: "inception_4a/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/double3x3a/bn" + top: "inception_4a/double3x3a/bn/sc" + name: 
"inception_4a/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/double3x3a/bn/sc" + top: "inception_4a/double3x3a/bn/sc" + name: "inception_4a/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/double3x3a/bn/sc" + top: "inception_4a/double3x3b" + name: "inception_4a/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/double3x3b" + name: "inception_4a/double3x3b/bn" + top: "inception_4a/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/double3x3b/bn" + top: "inception_4a/double3x3b/bn/sc" + name: "inception_4a/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4a/double3x3b/bn/sc" + top: "inception_4a/double3x3b/bn/sc" + name: "inception_4a/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_3c/output" + top: "inception_4a/pool" + name: "inception_4a/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_4a/pool" + top: "inception_4a/pool_proj" + name: "inception_4a/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4a/pool_proj" + name: "inception_4a/pool_proj/bn" + top: "inception_4a/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4a/pool_proj/bn" + top: "inception_4a/pool_proj/bn/sc" + name: "inception_4a/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: 
"inception_4a/pool_proj/bn/sc" + top: "inception_4a/pool_proj/bn/sc" + name: "inception_4a/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/1x1/bn/sc" + bottom: "inception_4a/3x3/bn/sc" + bottom: "inception_4a/double3x3b/bn/sc" + bottom: "inception_4a/pool_proj/bn/sc" + top: "inception_4a/output" + name: "inception_4a/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_4a/output" + top: "inception_4b/1x1" + name: "inception_4b/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/1x1" + name: "inception_4b/1x1/bn" + top: "inception_4b/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/1x1/bn" + top: "inception_4b/1x1/bn/sc" + name: "inception_4b/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/1x1/bn/sc" + top: "inception_4b/1x1/bn/sc" + name: "inception_4b/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/output" + top: "inception_4b/3x3_reduce" + name: "inception_4b/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/3x3_reduce" + name: "inception_4b/3x3_reduce/bn" + top: "inception_4b/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/3x3_reduce/bn" + top: "inception_4b/3x3_reduce/bn/sc" + name: "inception_4b/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/3x3_reduce/bn/sc" + top: "inception_4b/3x3_reduce/bn/sc" + name: "inception_4b/3x3_reduce/bn/sc/relu" + type: 
"ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/3x3_reduce/bn/sc" + top: "inception_4b/3x3" + name: "inception_4b/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/3x3" + name: "inception_4b/3x3/bn" + top: "inception_4b/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/3x3/bn" + top: "inception_4b/3x3/bn/sc" + name: "inception_4b/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/3x3/bn/sc" + top: "inception_4b/3x3/bn/sc" + name: "inception_4b/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/output" + top: "inception_4b/double3x3_reduce" + name: "inception_4b/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/double3x3_reduce" + name: "inception_4b/double3x3_reduce/bn" + top: "inception_4b/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/double3x3_reduce/bn" + top: "inception_4b/double3x3_reduce/bn/sc" + name: "inception_4b/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/double3x3_reduce/bn/sc" + top: "inception_4b/double3x3_reduce/bn/sc" + name: "inception_4b/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/double3x3_reduce/bn/sc" + top: "inception_4b/double3x3a" + name: "inception_4b/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + stride: 1 + 
weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/double3x3a" + name: "inception_4b/double3x3a/bn" + top: "inception_4b/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/double3x3a/bn" + top: "inception_4b/double3x3a/bn/sc" + name: "inception_4b/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/double3x3a/bn/sc" + top: "inception_4b/double3x3a/bn/sc" + name: "inception_4b/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/double3x3a/bn/sc" + top: "inception_4b/double3x3b" + name: "inception_4b/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/double3x3b" + name: "inception_4b/double3x3b/bn" + top: "inception_4b/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/double3x3b/bn" + top: "inception_4b/double3x3b/bn/sc" + name: "inception_4b/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/double3x3b/bn/sc" + top: "inception_4b/double3x3b/bn/sc" + name: "inception_4b/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4a/output" + top: "inception_4b/pool" + name: "inception_4b/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_4b/pool" + top: "inception_4b/pool_proj" + name: "inception_4b/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4b/pool_proj" + name: 
"inception_4b/pool_proj/bn" + top: "inception_4b/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4b/pool_proj/bn" + top: "inception_4b/pool_proj/bn/sc" + name: "inception_4b/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4b/pool_proj/bn/sc" + top: "inception_4b/pool_proj/bn/sc" + name: "inception_4b/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/1x1/bn/sc" + bottom: "inception_4b/3x3/bn/sc" + bottom: "inception_4b/double3x3b/bn/sc" + bottom: "inception_4b/pool_proj/bn/sc" + top: "inception_4b/output" + name: "inception_4b/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_4b/output" + top: "inception_4c/1x1" + name: "inception_4c/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/1x1" + name: "inception_4c/1x1/bn" + top: "inception_4c/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/1x1/bn" + top: "inception_4c/1x1/bn/sc" + name: "inception_4c/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/1x1/bn/sc" + top: "inception_4c/1x1/bn/sc" + name: "inception_4c/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/output" + top: "inception_4c/3x3_reduce" + name: "inception_4c/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/3x3_reduce" + name: "inception_4c/3x3_reduce/bn" + top: "inception_4c/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + 
bottom: "inception_4c/3x3_reduce/bn" + top: "inception_4c/3x3_reduce/bn/sc" + name: "inception_4c/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/3x3_reduce/bn/sc" + top: "inception_4c/3x3_reduce/bn/sc" + name: "inception_4c/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/3x3_reduce/bn/sc" + top: "inception_4c/3x3" + name: "inception_4c/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/3x3" + name: "inception_4c/3x3/bn" + top: "inception_4c/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/3x3/bn" + top: "inception_4c/3x3/bn/sc" + name: "inception_4c/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/3x3/bn/sc" + top: "inception_4c/3x3/bn/sc" + name: "inception_4c/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/output" + top: "inception_4c/double3x3_reduce" + name: "inception_4c/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/double3x3_reduce" + name: "inception_4c/double3x3_reduce/bn" + top: "inception_4c/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/double3x3_reduce/bn" + top: "inception_4c/double3x3_reduce/bn/sc" + name: "inception_4c/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/double3x3_reduce/bn/sc" + top: "inception_4c/double3x3_reduce/bn/sc" + name: "inception_4c/double3x3_reduce/bn/sc/relu" + 
type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/double3x3_reduce/bn/sc" + top: "inception_4c/double3x3a" + name: "inception_4c/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/double3x3a" + name: "inception_4c/double3x3a/bn" + top: "inception_4c/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/double3x3a/bn" + top: "inception_4c/double3x3a/bn/sc" + name: "inception_4c/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/double3x3a/bn/sc" + top: "inception_4c/double3x3a/bn/sc" + name: "inception_4c/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/double3x3a/bn/sc" + top: "inception_4c/double3x3b" + name: "inception_4c/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/double3x3b" + name: "inception_4c/double3x3b/bn" + top: "inception_4c/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/double3x3b/bn" + top: "inception_4c/double3x3b/bn/sc" + name: "inception_4c/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/double3x3b/bn/sc" + top: "inception_4c/double3x3b/bn/sc" + name: "inception_4c/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4b/output" + top: "inception_4c/pool" + name: "inception_4c/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_4c/pool" + top: 
"inception_4c/pool_proj" + name: "inception_4c/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4c/pool_proj" + name: "inception_4c/pool_proj/bn" + top: "inception_4c/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4c/pool_proj/bn" + top: "inception_4c/pool_proj/bn/sc" + name: "inception_4c/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4c/pool_proj/bn/sc" + top: "inception_4c/pool_proj/bn/sc" + name: "inception_4c/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/1x1/bn/sc" + bottom: "inception_4c/3x3/bn/sc" + bottom: "inception_4c/double3x3b/bn/sc" + bottom: "inception_4c/pool_proj/bn/sc" + top: "inception_4c/output" + name: "inception_4c/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_4c/output" + top: "inception_4d/1x1" + name: "inception_4d/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/1x1" + name: "inception_4d/1x1/bn" + top: "inception_4d/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/1x1/bn" + top: "inception_4d/1x1/bn/sc" + name: "inception_4d/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/1x1/bn/sc" + top: "inception_4d/1x1/bn/sc" + name: "inception_4d/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/output" + top: "inception_4d/3x3_reduce" + name: "inception_4d/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + 
convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/3x3_reduce" + name: "inception_4d/3x3_reduce/bn" + top: "inception_4d/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/3x3_reduce/bn" + top: "inception_4d/3x3_reduce/bn/sc" + name: "inception_4d/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/3x3_reduce/bn/sc" + top: "inception_4d/3x3_reduce/bn/sc" + name: "inception_4d/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/3x3_reduce/bn/sc" + top: "inception_4d/3x3" + name: "inception_4d/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/3x3" + name: "inception_4d/3x3/bn" + top: "inception_4d/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/3x3/bn" + top: "inception_4d/3x3/bn/sc" + name: "inception_4d/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/3x3/bn/sc" + top: "inception_4d/3x3/bn/sc" + name: "inception_4d/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/output" + top: "inception_4d/double3x3_reduce" + name: "inception_4d/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/double3x3_reduce" + name: "inception_4d/double3x3_reduce/bn" + top: "inception_4d/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: 
"inception_4d/double3x3_reduce/bn" + top: "inception_4d/double3x3_reduce/bn/sc" + name: "inception_4d/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/double3x3_reduce/bn/sc" + top: "inception_4d/double3x3_reduce/bn/sc" + name: "inception_4d/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/double3x3_reduce/bn/sc" + top: "inception_4d/double3x3a" + name: "inception_4d/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/double3x3a" + name: "inception_4d/double3x3a/bn" + top: "inception_4d/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/double3x3a/bn" + top: "inception_4d/double3x3a/bn/sc" + name: "inception_4d/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/double3x3a/bn/sc" + top: "inception_4d/double3x3a/bn/sc" + name: "inception_4d/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/double3x3a/bn/sc" + top: "inception_4d/double3x3b" + name: "inception_4d/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/double3x3b" + name: "inception_4d/double3x3b/bn" + top: "inception_4d/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/double3x3b/bn" + top: "inception_4d/double3x3b/bn/sc" + name: "inception_4d/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/double3x3b/bn/sc" + top: 
"inception_4d/double3x3b/bn/sc" + name: "inception_4d/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4c/output" + top: "inception_4d/pool" + name: "inception_4d/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_4d/pool" + top: "inception_4d/pool_proj" + name: "inception_4d/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 96 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4d/pool_proj" + name: "inception_4d/pool_proj/bn" + top: "inception_4d/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4d/pool_proj/bn" + top: "inception_4d/pool_proj/bn/sc" + name: "inception_4d/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4d/pool_proj/bn/sc" + top: "inception_4d/pool_proj/bn/sc" + name: "inception_4d/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/1x1/bn/sc" + bottom: "inception_4d/3x3/bn/sc" + bottom: "inception_4d/double3x3b/bn/sc" + bottom: "inception_4d/pool_proj/bn/sc" + top: "inception_4d/output" + name: "inception_4d/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_4d/output" + top: "inception_4e/3x3_reduce" + name: "inception_4e/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4e/3x3_reduce" + name: "inception_4e/3x3_reduce/bn" + top: "inception_4e/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4e/3x3_reduce/bn" + top: "inception_4e/3x3_reduce/bn/sc" + name: 
"inception_4e/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4e/3x3_reduce/bn/sc" + top: "inception_4e/3x3_reduce/bn/sc" + name: "inception_4e/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4e/3x3_reduce/bn/sc" + top: "inception_4e/3x3" + name: "inception_4e/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4e/3x3" + name: "inception_4e/3x3/bn" + top: "inception_4e/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4e/3x3/bn" + top: "inception_4e/3x3/bn/sc" + name: "inception_4e/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4e/3x3/bn/sc" + top: "inception_4e/3x3/bn/sc" + name: "inception_4e/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/output" + top: "inception_4e/double3x3_reduce" + name: "inception_4e/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4e/double3x3_reduce" + name: "inception_4e/double3x3_reduce/bn" + top: "inception_4e/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4e/double3x3_reduce/bn" + top: "inception_4e/double3x3_reduce/bn/sc" + name: "inception_4e/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4e/double3x3_reduce/bn/sc" + top: "inception_4e/double3x3_reduce/bn/sc" + name: "inception_4e/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: 
"inception_4e/double3x3_reduce/bn/sc" + top: "inception_4e/double3x3a" + name: "inception_4e/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4e/double3x3a" + name: "inception_4e/double3x3a/bn" + top: "inception_4e/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4e/double3x3a/bn" + top: "inception_4e/double3x3a/bn/sc" + name: "inception_4e/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4e/double3x3a/bn/sc" + top: "inception_4e/double3x3a/bn/sc" + name: "inception_4e/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4e/double3x3a/bn/sc" + top: "inception_4e/double3x3b" + name: "inception_4e/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 256 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_4e/double3x3b" + name: "inception_4e/double3x3b/bn" + top: "inception_4e/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_4e/double3x3b/bn" + top: "inception_4e/double3x3b/bn/sc" + name: "inception_4e/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_4e/double3x3b/bn/sc" + top: "inception_4e/double3x3b/bn/sc" + name: "inception_4e/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4d/output" + top: "inception_4e/pool" + name: "inception_4e/pool" + type: "Pooling" + pooling_param { + + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + bottom: "inception_4e/3x3/bn/sc" + bottom: "inception_4e/double3x3b/bn/sc" + bottom: "inception_4e/pool" + top: 
"inception_4e/output" + name: "inception_4e/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_4e/output" + top: "pool4/5x5_s3" + name: "pool4/5x5_s3" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 5 + stride: 3 + } +} +layer { + bottom: "pool4/5x5_s3" + top: "loss2/conv" + name: "loss2/conv" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "loss2/conv" + name: "loss2/conv/bn" + top: "loss2/conv/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "loss2/conv/bn" + top: "loss2/conv/bn/sc" + name: "loss2/conv/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "loss2/conv/bn/sc" + top: "loss2/conv/bn/sc" + name: "loss2/conv/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "loss2/conv/bn/sc" + top: "loss2/fc" + name: "loss2/fc" + type: "InnerProduct" + param { + lr_mult: 1 + decay_mult: 1 + } + inner_product_param { + num_output: 1024 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "loss2/fc" + name: "loss2/fc/bn" + top: "loss2/fc/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "loss2/fc/bn" + top: "loss2/fc/bn/sc" + name: "loss2/fc/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "loss2/fc/bn/sc" + top: "loss2/fc/bn/sc" + name: "loss2/fc/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "loss2/fc/bn/sc" + top: "loss2/classifier" + name: "loss2/classifier" + type: "InnerProduct" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + bottom: "loss2/classifier" + bottom: "label" + 
top: "loss2/loss" + name: "loss2/loss" + type: "SoftmaxWithLoss" + loss_weight: 0.3 +} +layer { + bottom: "loss2/classifier" + top: "loss2/prob" + name: "loss2/prob" + type: "Softmax" + include { + phase: TEST + } +} +layer { + bottom: "loss2/prob" + bottom: "label" + top: "loss2/top-1" + name: "loss2/top-1" + type: "Accuracy" + include { + phase: TEST + } +} +layer { + bottom: "loss2/prob" + bottom: "label" + top: "loss2/top-5" + name: "loss2/top-5" + type: "Accuracy" + accuracy_param { + top_k: 5 + } + include { + phase: TEST + } +} +layer { + bottom: "inception_4e/output" + top: "inception_5a/1x1" + name: "inception_5a/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 352 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/1x1" + name: "inception_5a/1x1/bn" + top: "inception_5a/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/1x1/bn" + top: "inception_5a/1x1/bn/sc" + name: "inception_5a/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/1x1/bn/sc" + top: "inception_5a/1x1/bn/sc" + name: "inception_5a/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4e/output" + top: "inception_5a/3x3_reduce" + name: "inception_5a/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/3x3_reduce" + name: "inception_5a/3x3_reduce/bn" + top: "inception_5a/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/3x3_reduce/bn" + top: "inception_5a/3x3_reduce/bn/sc" + name: "inception_5a/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: 
"inception_5a/3x3_reduce/bn/sc" + top: "inception_5a/3x3_reduce/bn/sc" + name: "inception_5a/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/3x3_reduce/bn/sc" + top: "inception_5a/3x3" + name: "inception_5a/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 320 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/3x3" + name: "inception_5a/3x3/bn" + top: "inception_5a/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/3x3/bn" + top: "inception_5a/3x3/bn/sc" + name: "inception_5a/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/3x3/bn/sc" + top: "inception_5a/3x3/bn/sc" + name: "inception_5a/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4e/output" + top: "inception_5a/double3x3_reduce" + name: "inception_5a/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 160 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/double3x3_reduce" + name: "inception_5a/double3x3_reduce/bn" + top: "inception_5a/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/double3x3_reduce/bn" + top: "inception_5a/double3x3_reduce/bn/sc" + name: "inception_5a/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/double3x3_reduce/bn/sc" + top: "inception_5a/double3x3_reduce/bn/sc" + name: "inception_5a/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/double3x3_reduce/bn/sc" + top: "inception_5a/double3x3a" + name: "inception_5a/double3x3a" + type: "Convolution" + param { + 
lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 224 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/double3x3a" + name: "inception_5a/double3x3a/bn" + top: "inception_5a/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/double3x3a/bn" + top: "inception_5a/double3x3a/bn/sc" + name: "inception_5a/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/double3x3a/bn/sc" + top: "inception_5a/double3x3a/bn/sc" + name: "inception_5a/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/double3x3a/bn/sc" + top: "inception_5a/double3x3b" + name: "inception_5a/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 224 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/double3x3b" + name: "inception_5a/double3x3b/bn" + top: "inception_5a/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/double3x3b/bn" + top: "inception_5a/double3x3b/bn/sc" + name: "inception_5a/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/double3x3b/bn/sc" + top: "inception_5a/double3x3b/bn/sc" + name: "inception_5a/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_4e/output" + top: "inception_5a/pool" + name: "inception_5a/pool" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_5a/pool" + top: "inception_5a/pool_proj" + name: "inception_5a/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + 
weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5a/pool_proj" + name: "inception_5a/pool_proj/bn" + top: "inception_5a/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5a/pool_proj/bn" + top: "inception_5a/pool_proj/bn/sc" + name: "inception_5a/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5a/pool_proj/bn/sc" + top: "inception_5a/pool_proj/bn/sc" + name: "inception_5a/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/1x1/bn/sc" + bottom: "inception_5a/3x3/bn/sc" + bottom: "inception_5a/double3x3b/bn/sc" + bottom: "inception_5a/pool_proj/bn/sc" + top: "inception_5a/output" + name: "inception_5a/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_5a/output" + top: "inception_5b/1x1" + name: "inception_5b/1x1" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 352 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/1x1" + name: "inception_5b/1x1/bn" + top: "inception_5b/1x1/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/1x1/bn" + top: "inception_5b/1x1/bn/sc" + name: "inception_5b/1x1/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/1x1/bn/sc" + top: "inception_5b/1x1/bn/sc" + name: "inception_5b/1x1/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/output" + top: "inception_5b/3x3_reduce" + name: "inception_5b/3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/3x3_reduce" + name: 
"inception_5b/3x3_reduce/bn" + top: "inception_5b/3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/3x3_reduce/bn" + top: "inception_5b/3x3_reduce/bn/sc" + name: "inception_5b/3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/3x3_reduce/bn/sc" + top: "inception_5b/3x3_reduce/bn/sc" + name: "inception_5b/3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5b/3x3_reduce/bn/sc" + top: "inception_5b/3x3" + name: "inception_5b/3x3" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 320 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/3x3" + name: "inception_5b/3x3/bn" + top: "inception_5b/3x3/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/3x3/bn" + top: "inception_5b/3x3/bn/sc" + name: "inception_5b/3x3/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/3x3/bn/sc" + top: "inception_5b/3x3/bn/sc" + name: "inception_5b/3x3/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/output" + top: "inception_5b/double3x3_reduce" + name: "inception_5b/double3x3_reduce" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 192 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/double3x3_reduce" + name: "inception_5b/double3x3_reduce/bn" + top: "inception_5b/double3x3_reduce/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/double3x3_reduce/bn" + top: "inception_5b/double3x3_reduce/bn/sc" + name: "inception_5b/double3x3_reduce/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: 
"inception_5b/double3x3_reduce/bn/sc" + top: "inception_5b/double3x3_reduce/bn/sc" + name: "inception_5b/double3x3_reduce/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5b/double3x3_reduce/bn/sc" + top: "inception_5b/double3x3a" + name: "inception_5b/double3x3a" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 224 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/double3x3a" + name: "inception_5b/double3x3a/bn" + top: "inception_5b/double3x3a/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/double3x3a/bn" + top: "inception_5b/double3x3a/bn/sc" + name: "inception_5b/double3x3a/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/double3x3a/bn/sc" + top: "inception_5b/double3x3a/bn/sc" + name: "inception_5b/double3x3a/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5b/double3x3a/bn/sc" + top: "inception_5b/double3x3b" + name: "inception_5b/double3x3b" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 224 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/double3x3b" + name: "inception_5b/double3x3b/bn" + top: "inception_5b/double3x3b/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/double3x3b/bn" + top: "inception_5b/double3x3b/bn/sc" + name: "inception_5b/double3x3b/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/double3x3b/bn/sc" + top: "inception_5b/double3x3b/bn/sc" + name: "inception_5b/double3x3b/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5a/output" + top: "inception_5b/pool" + name: "inception_5b/pool" + type: 
"Pooling" + pooling_param { + + pool: MAX + kernel_size: 3 + stride: 1 + pad: 1 + } +} +layer { + bottom: "inception_5b/pool" + top: "inception_5b/pool_proj" + name: "inception_5b/pool_proj" + type: "Convolution" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_term: false + } +} +layer { + bottom: "inception_5b/pool_proj" + name: "inception_5b/pool_proj/bn" + top: "inception_5b/pool_proj/bn" + type: "BatchNorm" + batch_norm_param { + + } +} +layer { + bottom: "inception_5b/pool_proj/bn" + top: "inception_5b/pool_proj/bn/sc" + name: "inception_5b/pool_proj/bn/sc" + type: "Scale" + scale_param { + bias_term: true + } +} +layer { + bottom: "inception_5b/pool_proj/bn/sc" + top: "inception_5b/pool_proj/bn/sc" + name: "inception_5b/pool_proj/bn/sc/relu" + type: "ReLU" + relu_param { + + } +} +layer { + bottom: "inception_5b/1x1/bn/sc" + bottom: "inception_5b/3x3/bn/sc" + bottom: "inception_5b/double3x3b/bn/sc" + bottom: "inception_5b/pool_proj/bn/sc" + top: "inception_5b/output" + name: "inception_5b/output" + type: "Concat" + concat_param { + + } +} +layer { + bottom: "inception_5b/output" + top: "pool5/7x7_s1" + name: "pool5/7x7_s1" + type: "Pooling" + pooling_param { + + pool: AVE + kernel_size: 7 + stride: 1 + } +} +layer { + bottom: "pool5/7x7_s1" + top: "loss3/classifier" + name: "loss3/classifier" + type: "InnerProduct" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + bottom: "loss3/classifier" + bottom: "label" + top: "loss3/loss" + name: "loss3/loss" + type: "SoftmaxWithLoss" + loss_weight: 1 +} +layer { + bottom: "loss3/classifier" + top: "loss3/prob" + name: "loss3/prob" + type: "Softmax" + include { + phase: TEST + } +} +layer { + bottom: "loss3/prob" + 
bottom: "label" + top: "loss3/top-1" + name: "loss3/top-1" + type: "Accuracy" + include { + phase: TEST + } +} +layer { + bottom: "loss3/prob" + bottom: "label" + top: "loss3/top-5" + name: "loss3/top-5" + type: "Accuracy" + accuracy_param { + top_k: 5 + } + include { + phase: TEST + } +} diff --git a/models/intel_optimized_models/resnet_50/solver.prototxt b/models/intel_optimized_models/resnet_50/solver.prototxt new file mode 100644 index 000000000..2fe9feb99 --- /dev/null +++ b/models/intel_optimized_models/resnet_50/solver.prototxt @@ -0,0 +1,17 @@ +net: "models/intel_optimized_models/resnet_50/train_val.prototxt" +test_iter: 1000 +test_interval: 1248 +test_initialization: false +display: 40 +base_lr: 0.4 +lr_policy: "multistep" +stepvalue:37440 +stepvalue:74880 +stepvalue:99840 +gamma: 0.1 +max_iter: 112600 +momentum: 0.9 +weight_decay: 0.0001 +snapshot: 12480 +snapshot_prefix: "models/intel_optimized_models/resnet_50/resnet_50_" +solver_mode: CPU diff --git a/models/intel_optimized_models/resnet_50/solver_dummydata.prototxt b/models/intel_optimized_models/resnet_50/solver_dummydata.prototxt new file mode 100644 index 000000000..3ba69689f --- /dev/null +++ b/models/intel_optimized_models/resnet_50/solver_dummydata.prototxt @@ -0,0 +1,25 @@ +#This is Intel(R) optimized (in terms of time to train) version of solver for the ResNet-50 model described in the [Deep Residual Learning for Image Recognition](https://arxiv.org/abs/1512.03385) publication. +#This header was adapted from the AlexNet solver in the /models/bvlc_alexnet/ directory of this repository. +#Differences from that solver: +#- lr_policy is set to poly instead of step +#- base_lr is decreased to 0.007 +#- max_iter is decreased to 5000 +#- power is set to 0.6 +# +#NOTE(review): the Top-5 and Top-1 results below were reported for the original AlexNet solver and have not been re-measured for this ResNet-50 dummy-data configuration: +#Top-5: 80.4% +#Top-1: 57.4% +#Training was performed using server equipped with Intel(R) Xeon Phi(TM) CPU 7250 processor.
+net: "models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt" +test_iter: 1000 +test_interval: 10000 +base_lr: 0.007 +lr_policy: "poly" +power: 0.6 +display: 1 +max_iter: 5000 +momentum: 0.9 +weight_decay: 0.0005 +snapshot: 50000 +snapshot_prefix: "models/intel_optimized_models/resnet_50/resnet_50_train" +solver_mode: CPU diff --git a/models/intel_optimized_models/resnet_50/train_val.prototxt b/models/intel_optimized_models/resnet_50/train_val.prototxt new file mode 100644 index 000000000..75bff6269 --- /dev/null +++ b/models/intel_optimized_models/resnet_50/train_val.prototxt @@ -0,0 +1,3322 @@ +name: "ResNet-50" +bn_stats_batch_size: 32 +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TRAIN + } + transform_param { + mirror: true + crop_size: 224 + scale: 0.0078125 + mean_value: 104 + mean_value: 117 + mean_value: 123 + random_aspect_ratio_param { + min_area_ratio: 0.08 + max_area_ratio: 1 + aspect_ratio_change: 0.75 + resize_param { + interp_mode: CUBIC + } + } + } + data_param { + source: "examples/imagenet/ilsvrc12_train_lmdb" + batch_size: 128 + backend: LMDB + prefetch: 2 + shuffle: true + } +} +layer { + name: "data" + type: "Data" + top: "data" + top: "label" + include { + phase: TEST + } + transform_param { + mirror: false + crop_size: 224 + scale: 0.0078125 + mean_value: 104 + mean_value: 117 + mean_value: 123 + random_resize_param { + min_size: 256 + max_size: 256 + resize_param { + interp_mode: CUBIC + } + } + } + data_param { + source: "examples/imagenet/ilsvrc12_val_lmdb" + batch_size: 50 + backend: LMDB + } +} + +layer { + bottom: "data" + top: "conv1" + name: "conv1" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 7 + pad: 3 + stride: 2 + weight_filler { + type: "msra" + variance_norm: FAN_OUT + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "bn_conv1" + type: "BatchNorm" + param { lr_mult: 0 } + param { 
lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "scale_conv1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "conv1_relu" + type: "ReLU" + relu_param { + } +} + +layer { + bottom: "conv1" + top: "pool1" + name: "pool1" + type: "Pooling" + pooling_param { + kernel_size: 3 + stride: 2 + pool: MAX + } +} + +layer { + bottom: "pool1" + top: "res2a_branch1" + name: "res2a_branch1" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "bn2a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "scale2a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "pool1" + top: "res2a_branch2a" + name: "res2a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "bn2a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "scale2a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + 
bias_term: true + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "res2a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2b" + name: "res2a_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "bn2a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "scale2a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "res2a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2c" + name: "res2a_branch2c" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "bn2a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "scale2a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch1" + bottom: "res2a_branch2c" + top: "res2a" + name: "res2a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2a" + top: "res2a" + name: "res2a_relu" + 
type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a" + top: "res2b_branch2a" + name: "res2b_branch2a" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "bn2b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "scale2b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "res2b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2b" + name: "res2b_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "bn2b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "scale2b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "res2b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2c" + name: "res2b_branch2c" + type: "Convolution" + convolution_param { + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: 
false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "bn2b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "scale2b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a" + bottom: "res2b_branch2c" + top: "res2b" + name: "res2b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2b" + top: "res2b" + name: "res2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b" + top: "res2c_branch2a" + name: "res2c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "bn2c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "scale2c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "res2c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2b" + name: "res2c_branch2b" + type: "Convolution" + convolution_param { + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: 
"res2c_branch2b" + top: "res2c_branch2b" + name: "bn2c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "scale2c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "res2c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2c" + name: "res2c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "bn2c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "scale2c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b" + bottom: "res2c_branch2c" + top: "res2c" + name: "res2c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2c" + top: "res2c" + name: "res2c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c" + top: "res3a_branch1" + name: "res3a_branch1" + type: "Convolution" + convolution_param { + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "bn3a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + 
param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "scale3a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c" + top: "res3a_branch2a" + name: "res3a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "bn3a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "scale3a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "res3a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2b" + name: "res3a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "bn3a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "scale3a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + 
name: "res3a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2c" + name: "res3a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "bn3a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "scale3a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch1" + bottom: "res3a_branch2c" + top: "res3a" + name: "res3a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3a" + top: "res3a" + name: "res3a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a" + top: "res3b_branch2a" + name: "res3b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "bn3b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "scale3b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "res3b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2a" + top: 
"res3b_branch2b" + name: "res3b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "bn3b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "scale3b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "res3b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2c" + name: "res3b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + name: "bn3b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + name: "scale3b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a" + bottom: "res3b_branch2c" + top: "res3b" + name: "res3b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3b" + top: "res3b" + name: "res3b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b" + top: "res3c_branch2a" + name: "res3c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 
0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "bn3c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "scale3c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "res3c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2b" + name: "res3c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "bn3c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "scale3c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "res3c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2c" + name: "res3c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "bn3c_branch2c" + type: 
"BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "scale3c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b" + bottom: "res3c_branch2c" + top: "res3c" + name: "res3c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3c" + top: "res3c" + name: "res3c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c" + top: "res3d_branch2a" + name: "res3d_branch2a" + type: "Convolution" + convolution_param { + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "bn3d_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "scale3d_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "res3d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2b" + name: "res3d_branch2b" + type: "Convolution" + convolution_param { + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "bn3d_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 
+ filler { value: 1 } + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "scale3d_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "res3d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2c" + name: "res3d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "bn3d_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "scale3d_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c" + bottom: "res3d_branch2c" + top: "res3d" + name: "res3d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3d" + top: "res3d" + name: "res3d_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d" + top: "res4a_branch1" + name: "res4a_branch1" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "bn4a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "scale4a_branch1" + type: "Scale" + 
param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d" + top: "res4a_branch2a" + name: "res4a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "bn4a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "scale4a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "res4a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2b" + name: "res4a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "bn4a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "scale4a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "res4a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2c" + name: "res4a_branch2c" + type: "Convolution" + convolution_param { + + 
num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "bn4a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "scale4a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch1" + bottom: "res4a_branch2c" + top: "res4a" + name: "res4a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4a" + top: "res4a" + name: "res4a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a" + top: "res4b_branch2a" + name: "res4b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "bn4b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "scale4b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "res4b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2b" + name: "res4b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + 
bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "bn4b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "scale4b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "res4b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2c" + name: "res4b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "bn4b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "scale4b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a" + bottom: "res4b_branch2c" + top: "res4b" + name: "res4b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4b" + top: "res4b" + name: "res4b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b" + top: "res4c_branch2a" + name: "res4c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: 
"bn4c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "scale4c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "res4c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2b" + name: "res4c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "bn4c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "scale4c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "res4c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2c" + name: "res4c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4c_branch2c" + top: "res4c_branch2c" + name: "bn4c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4c_branch2c" 
+ top: "res4c_branch2c" + name: "scale4c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b" + bottom: "res4c_branch2c" + top: "res4c" + name: "res4c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4c" + top: "res4c" + name: "res4c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c" + top: "res4d_branch2a" + name: "res4d_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "bn4d_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "scale4d_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "res4d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2b" + name: "res4d_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "bn4d_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "scale4d_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + 
scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "res4d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2c" + name: "res4d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "bn4d_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "scale4d_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c" + bottom: "res4d_branch2c" + top: "res4d" + name: "res4d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4d" + top: "res4d" + name: "res4d_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d" + top: "res4e_branch2a" + name: "res4e_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "bn4e_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "scale4e_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: 
"res4e_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2b" + name: "res4e_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "bn4e_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "scale4e_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "res4e_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2c" + name: "res4e_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "bn4e_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "scale4e_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d" + bottom: "res4e_branch2c" + top: "res4e" + name: "res4e" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4e" + top: "res4e" + name: "res4e_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e" + top: "res4f_branch2a" + 
name: "res4f_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "bn4f_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "scale4f_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "res4f_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2b" + name: "res4f_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "bn4f_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "scale4f_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "res4f_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2c" + name: "res4f_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 
0 + } + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "bn4f_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "scale4f_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e" + bottom: "res4f_branch2c" + top: "res4f" + name: "res4f" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4f" + top: "res4f" + name: "res4f_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f" + top: "res5a_branch1" + name: "res5a_branch1" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "bn5a_branch1" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "scale5a_branch1" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f" + top: "res5a_branch2a" + name: "res5a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "bn5a_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + 
+layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "scale5a_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "res5a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2b" + name: "res5a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 2 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "bn5a_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "scale5a_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "res5a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2c" + name: "res5a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "bn5a_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "scale5a_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: 
"res5a_branch1" + bottom: "res5a_branch2c" + top: "res5a" + name: "res5a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res5a" + top: "res5a" + name: "res5a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a" + top: "res5b_branch2a" + name: "res5b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "bn5b_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "scale5b_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "res5b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2b" + name: "res5b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "bn5b_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "scale5b_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "res5b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { 
+ bottom: "res5b_branch2b" + top: "res5b_branch2c" + name: "res5b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "bn5b_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "scale5b_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a" + bottom: "res5b_branch2c" + top: "res5b" + name: "res5b" + type: "Eltwise" + eltwise_param { + } +} + +layer { + bottom: "res5b" + top: "res5b" + name: "res5b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b" + top: "res5c_branch2a" + name: "res5c_branch2a" + type: "Convolution" + convolution_param { + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "bn5c_branch2a" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "scale5c_branch2a" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "res5c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2b" + name: "res5c_branch2b" + type: "Convolution" + convolution_param { + 
num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "bn5c_branch2b" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 1 } + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "scale5c_branch2b" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "res5c_branch2b_relu" + type: "ReLU" + relu_param { + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2c" + name: "res5c_branch2c" + type: "Convolution" + convolution_param { + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "msra" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + name: "bn5c_branch2c" + type: "BatchNorm" + param { lr_mult: 0 } + param { lr_mult: 0 } + param { lr_mult: 0 } + batch_norm_param { + moving_average_fraction: 0.9 + filler { value: 0 } + } +} + +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + name: "scale5c_branch2c" + type: "Scale" + param { decay_mult: 0 } + param { decay_mult: 0 } + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b" + bottom: "res5c_branch2c" + top: "res5c" + name: "res5c" + type: "Eltwise" + eltwise_param { + } +} + +layer { + bottom: "res5c" + top: "res5c" + name: "res5c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c" + top: "pool5" + name: "pool5" + type: "Pooling" + pooling_param { + kernel_size: 7 + stride: 1 + pool: AVE + } +} + +layer { + bottom: "pool5" + top: "fc1000" + name: "fc1000" + type: "InnerProduct" + inner_product_param { + 
num_output: 1000 + weight_filler { + type: "gaussian" + std: 0.01 + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "fc1000" + bottom: "label" + top: "loss" + name: "prob" + type: "SoftmaxWithLoss" +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-1" +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-5" + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt b/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt new file mode 100644 index 000000000..ba298f468 --- /dev/null +++ b/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt @@ -0,0 +1,3051 @@ +name: "ResNet-50" +layer { + name: "data" + type: "DummyData" + top: "data" + include { + phase: TRAIN + } + dummy_data_param { + shape: { dim: 32 dim: 3 dim: 224 dim: 224 } + data_filler { + type: "constant" + value: 0.01 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + include { + phase: TRAIN + } + dummy_data_param { + shape: { dim: 32 } + data_filler { + type: "constant" + } + } +} + +layer { + bottom: "data" + top: "conv1" + name: "conv1" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 7 + pad: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "bn_conv1" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "scale_conv1" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "conv1" + top: "conv1" + name: "conv1_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "conv1" + top: "pool1" + name: "pool1" + type: "Pooling" + pooling_param { + + kernel_size: 3 + stride: 2 + pool: MAX + } +} + +layer { + bottom: "pool1" + top: 
"res2a_branch1" + name: "res2a_branch1" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "bn2a_branch1" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2a_branch1" + top: "res2a_branch1" + name: "scale2a_branch1" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "pool1" + top: "res2a_branch2a" + name: "res2a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "bn2a_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "scale2a_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2a" + name: "res2a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a_branch2a" + top: "res2a_branch2b" + name: "res2a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "bn2a_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "scale2a_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch2b" + top: "res2a_branch2b" + name: "res2a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: 
"res2a_branch2b" + top: "res2a_branch2c" + name: "res2a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "bn2a_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2a_branch2c" + top: "res2a_branch2c" + name: "scale2a_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a_branch1" + bottom: "res2a_branch2c" + top: "res2a" + name: "res2a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2a" + top: "res2a" + name: "res2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2a" + top: "res2b_branch2a" + name: "res2b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "bn2b_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "scale2b_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2a" + name: "res2b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2a" + top: "res2b_branch2b" + name: "res2b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "bn2b_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: 
"res2b_branch2b" + top: "res2b_branch2b" + name: "scale2b_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2b" + name: "res2b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b_branch2b" + top: "res2b_branch2c" + name: "res2b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "bn2b_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2b_branch2c" + top: "res2b_branch2c" + name: "scale2b_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2a" + bottom: "res2b_branch2c" + top: "res2b" + name: "res2b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2b" + top: "res2b" + name: "res2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2b" + top: "res2c_branch2a" + name: "res2c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "bn2c_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "scale2c_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2a" + name: "res2c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2a" + top: "res2c_branch2b" + name: "res2c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 64 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false 
+ weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "bn2c_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "scale2c_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2b" + name: "res2c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c_branch2b" + top: "res2c_branch2c" + name: "res2c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "bn2c_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res2c_branch2c" + top: "res2c_branch2c" + name: "scale2c_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2b" + bottom: "res2c_branch2c" + top: "res2c" + name: "res2c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res2c" + top: "res2c" + name: "res2c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res2c" + top: "res3a_branch1" + name: "res3a_branch1" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "bn3a_branch1" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3a_branch1" + top: "res3a_branch1" + name: "scale3a_branch1" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res2c" + top: "res3a_branch2a" + name: "res3a_branch2a" + type: 
"Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "bn3a_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "scale3a_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2a" + name: "res3a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2a" + top: "res3a_branch2b" + name: "res3a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "bn3a_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "scale3a_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2b" + name: "res3a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a_branch2b" + top: "res3a_branch2c" + name: "res3a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "bn3a_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3a_branch2c" + top: "res3a_branch2c" + name: "scale3a_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a_branch1" + bottom: 
"res3a_branch2c" + top: "res3a" + name: "res3a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3a" + top: "res3a" + name: "res3a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3a" + top: "res3b_branch2a" + name: "res3b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "bn3b_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "scale3b_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2a" + name: "res3b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2a" + top: "res3b_branch2b" + name: "res3b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "bn3b_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "scale3b_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2b" + name: "res3b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b_branch2b" + top: "res3b_branch2c" + name: "res3b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + 
name: "bn3b_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3b_branch2c" + top: "res3b_branch2c" + name: "scale3b_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3a" + bottom: "res3b_branch2c" + top: "res3b" + name: "res3b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3b" + top: "res3b" + name: "res3b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3b" + top: "res3c_branch2a" + name: "res3c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "bn3c_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "scale3c_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2a" + name: "res3c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2a" + top: "res3c_branch2b" + name: "res3c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "bn3c_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "scale3c_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2b" + name: "res3c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c_branch2b" + top: "res3c_branch2c" + name: "res3c_branch2c" + type: "Convolution" + 
convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "bn3c_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3c_branch2c" + top: "res3c_branch2c" + name: "scale3c_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3b" + bottom: "res3c_branch2c" + top: "res3c" + name: "res3c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3c" + top: "res3c" + name: "res3c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3c" + top: "res3d_branch2a" + name: "res3d_branch2a" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "bn3d_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "scale3d_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2a" + name: "res3d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2a" + top: "res3d_branch2b" + name: "res3d_branch2b" + type: "Convolution" + convolution_param { + + num_output: 128 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "bn3d_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "scale3d_branch2b" + type: "Scale" + scale_param { + 
bias_term: true + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2b" + name: "res3d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d_branch2b" + top: "res3d_branch2c" + name: "res3d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "bn3d_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res3d_branch2c" + top: "res3d_branch2c" + name: "scale3d_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3c" + bottom: "res3d_branch2c" + top: "res3d" + name: "res3d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res3d" + top: "res3d" + name: "res3d_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res3d" + top: "res4a_branch1" + name: "res4a_branch1" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "bn4a_branch1" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4a_branch1" + top: "res4a_branch1" + name: "scale4a_branch1" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res3d" + top: "res4a_branch2a" + name: "res4a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "bn4a_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { 
+ bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "scale4a_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2a" + name: "res4a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2a" + top: "res4a_branch2b" + name: "res4a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "bn4a_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "scale4a_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2b" + name: "res4a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a_branch2b" + top: "res4a_branch2c" + name: "res4a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "bn4a_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4a_branch2c" + top: "res4a_branch2c" + name: "scale4a_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a_branch1" + bottom: "res4a_branch2c" + top: "res4a" + name: "res4a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4a" + top: "res4a" + name: "res4a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4a" + top: "res4b_branch2a" + name: "res4b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 
1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "bn4b_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "scale4b_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2a" + name: "res4b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2a" + top: "res4b_branch2b" + name: "res4b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "bn4b_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "scale4b_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2b" + name: "res4b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b_branch2b" + top: "res4b_branch2c" + name: "res4b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "bn4b_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4b_branch2c" + top: "res4b_branch2c" + name: "scale4b_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4a" + bottom: "res4b_branch2c" + top: "res4b" + name: "res4b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: 
"res4b" + top: "res4b" + name: "res4b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4b" + top: "res4c_branch2a" + name: "res4c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "bn4c_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "scale4c_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2a" + name: "res4c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2a" + top: "res4c_branch2b" + name: "res4c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "bn4c_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "scale4c_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2b" + name: "res4c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c_branch2b" + top: "res4c_branch2c" + name: "res4c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4c_branch2c" + top: "res4c_branch2c" + name: "bn4c_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4c_branch2c" 
+ top: "res4c_branch2c" + name: "scale4c_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4b" + bottom: "res4c_branch2c" + top: "res4c" + name: "res4c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4c" + top: "res4c" + name: "res4c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4c" + top: "res4d_branch2a" + name: "res4d_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "bn4d_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "scale4d_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2a" + name: "res4d_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2a" + top: "res4d_branch2b" + name: "res4d_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "bn4d_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "scale4d_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2b" + name: "res4d_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d_branch2b" + top: "res4d_branch2c" + name: "res4d_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + 
weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "bn4d_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4d_branch2c" + top: "res4d_branch2c" + name: "scale4d_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4c" + bottom: "res4d_branch2c" + top: "res4d" + name: "res4d" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4d" + top: "res4d" + name: "res4d_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4d" + top: "res4e_branch2a" + name: "res4e_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "bn4e_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "scale4e_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2a" + name: "res4e_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2a" + top: "res4e_branch2b" + name: "res4e_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "bn4e_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: "scale4e_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2b" + name: 
"res4e_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e_branch2b" + top: "res4e_branch2c" + name: "res4e_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "bn4e_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4e_branch2c" + top: "res4e_branch2c" + name: "scale4e_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4d" + bottom: "res4e_branch2c" + top: "res4e" + name: "res4e" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4e" + top: "res4e" + name: "res4e_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4e" + top: "res4f_branch2a" + name: "res4f_branch2a" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "bn4f_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "scale4f_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2a" + name: "res4f_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2a" + top: "res4f_branch2b" + name: "res4f_branch2b" + type: "Convolution" + convolution_param { + + num_output: 256 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "bn4f_branch2b" + type: 
"BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "scale4f_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2b" + name: "res4f_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f_branch2b" + top: "res4f_branch2c" + name: "res4f_branch2c" + type: "Convolution" + convolution_param { + + num_output: 1024 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "bn4f_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res4f_branch2c" + top: "res4f_branch2c" + name: "scale4f_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4e" + bottom: "res4f_branch2c" + top: "res4f" + name: "res4f" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res4f" + top: "res4f" + name: "res4f_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res4f" + top: "res5a_branch1" + name: "res5a_branch1" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "bn5a_branch1" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5a_branch1" + top: "res5a_branch1" + name: "scale5a_branch1" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res4f" + top: "res5a_branch2a" + name: "res5a_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 2 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + 
value: 0.2 + } + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "bn5a_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "scale5a_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2a" + name: "res5a_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2a" + top: "res5a_branch2b" + name: "res5a_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "bn5a_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "scale5a_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2b" + name: "res5a_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5a_branch2b" + top: "res5a_branch2c" + name: "res5a_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "bn5a_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5a_branch2c" + top: "res5a_branch2c" + name: "scale5a_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5a_branch1" + bottom: "res5a_branch2c" + top: "res5a" + name: "res5a" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res5a" + top: "res5a" + name: "res5a_relu" + type: "ReLU" + relu_param { + + } +} + 
+layer { + bottom: "res5a" + top: "res5b_branch2a" + name: "res5b_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "bn5b_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "scale5b_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2a" + name: "res5b_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b_branch2a" + top: "res5b_branch2b" + name: "res5b_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "bn5b_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "scale5b_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2b" + name: "res5b_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b_branch2b" + top: "res5b_branch2c" + name: "res5b_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "bn5b_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5b_branch2c" + top: "res5b_branch2c" + name: "scale5b_branch2c" + type: "Scale" + scale_param { + 
bias_term: true + } +} + +layer { + bottom: "res5a" + bottom: "res5b_branch2c" + top: "res5b" + name: "res5b" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res5b" + top: "res5b" + name: "res5b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5b" + top: "res5c_branch2a" + name: "res5c_branch2a" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "bn5c_branch2a" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "scale5c_branch2a" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2a" + name: "res5c_branch2a_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c_branch2a" + top: "res5c_branch2b" + name: "res5c_branch2b" + type: "Convolution" + convolution_param { + + num_output: 512 + kernel_size: 3 + pad: 1 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "bn5c_branch2b" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "scale5c_branch2b" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2b" + name: "res5c_branch2b_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c_branch2b" + top: "res5c_branch2c" + name: "res5c_branch2c" + type: "Convolution" + convolution_param { + + num_output: 2048 + kernel_size: 1 + pad: 0 + stride: 1 + bias_term: false + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} 
+ +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + name: "bn5c_branch2c" + type: "BatchNorm" + batch_norm_param { + + + } +} + +layer { + bottom: "res5c_branch2c" + top: "res5c_branch2c" + name: "scale5c_branch2c" + type: "Scale" + scale_param { + bias_term: true + } +} + +layer { + bottom: "res5b" + bottom: "res5c_branch2c" + top: "res5c" + name: "res5c" + type: "Eltwise" + eltwise_param { + + } +} + +layer { + bottom: "res5c" + top: "res5c" + name: "res5c_relu" + type: "ReLU" + relu_param { + + } +} + +layer { + bottom: "res5c" + top: "pool5" + name: "pool5" + type: "Pooling" + pooling_param { + + kernel_size: 7 + stride: 1 + pool: AVE + } +} + +layer { + bottom: "pool5" + top: "fc1000" + name: "fc1000" + type: "InnerProduct" + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} + +layer { + bottom: "fc1000" + bottom: "label" + top: "prob" + name: "prob" + type: "SoftmaxWithLoss" + include { + phase: TRAIN + } +} +layer { + name: "loss3/top-1" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-1" + include { + phase: TEST + } +} +layer { + name: "loss3/top-5" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "loss3/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/scripts/benchmark_config_template.json b/scripts/benchmark_config_template.json new file mode 100644 index 000000000..440939c62 --- /dev/null +++ b/scripts/benchmark_config_template.json @@ -0,0 +1,38 @@ +{ + "params":{ + "topology" : "your topology like alexnet/googlenet/googlenet_v2/resnet_50/all", + "hostfile" : "/your/hostfile", + "network" : "tcp or opa", + "netmask" : "your ethernet card name like eth0", + "dummy_data_use" : true, + "scal_test" : false, + "caffe_bin" : "", + "engine" : "choose CAFFE, MKL2017 or MKLDNN" + }, + "batch_size_table" : { + "alexnet" : { + "bdw" : "1024", + "skx" : "1024", + "knl" : "512", + "knm" : 
"1024" + }, + "googlenet" : { + "bdw" : "128", + "skx" : "144", + "knl" : "144", + "knm" : "144" + }, + "googlenet_v2" : { + "bdw" : "128", + "skx" : "192", + "knl" : "192", + "knm" : "128" + }, + "resnet_50" : { + "bdw" : "32", + "skx" : "96", + "knl" : "64", + "knm" : "64" + } + } +} diff --git a/scripts/run_benchmark.py b/scripts/run_benchmark.py new file mode 100755 index 000000000..7f67764e0 --- /dev/null +++ b/scripts/run_benchmark.py @@ -0,0 +1,369 @@ +import subprocess +import argparse +import re +import os +import time +import json +import socket +import logging + +topology_list = ["alexnet", "googlenet", "googlenet_v2", "resnet_50", 'all'] +class CaffeBenchmark(object): + '''Used to do caffe benchmarking''' + def __init__(self, topology, bkm_batch_size, host_file = "", network = "", tcp_netmask = "", engine = "", dummy_data_use = True, caffe_bin = "", scal_test = True): + '''params initialization''' + self.topology = topology + self.host_file = host_file + self.network = network + self.tcp_netmask = tcp_netmask + self.dummy_data_use = dummy_data_use + self.engine = engine + self.caffe_bin = caffe_bin + self.scal_test = scal_test + self.num_nodes = 1 + self.cpu_model = "skx" + # flag used to mark if we have detected which cpu model we're using + self.unknown_cpu = False + self.iterations = 100 + self.caffe_root = os.path.dirname(os.path.dirname(__file__)) + # model template path + self.model_path = self.caffe_root + "models/intel_optimized_models" + # specific script used to run intelcaffe + self.caffe_run_script = self.caffe_root + "scripts/run_intelcaffe.sh" + self.bkm_batch_size = bkm_batch_size + self.check_parameters() + current_time = time.strftime("%Y%m%d%H%M%S") + logging.basicConfig(filename = 'result-benchmark-{}.log'.format(current_time),level = logging.INFO) + + def is_supported_topology(self): + '''check if input topology is supported''' + if self.topology not in topology_list: + logging.exception("The topology you specified as {} is not 
supported. Supported topologies are {}".format(self.topology, topology_list)) + + def calculate_numnodes(self): + '''calculate current using nodes''' + if os.path.isfile(self.host_file): + with open(self.host_file, 'r') as f: + self.num_nodes = len([line for line in f.readlines() if line.strip() != '']) + if self.num_nodes == 0: + logging.exception("Error: empty host list. Exit.") + return self.num_nodes + + def _exec_command(self, cmd): + '''execute shell command''' + return subprocess.check_output(cmd, stderr = subprocess.STDOUT, shell = True) + + def _exec_command_and_show(self, cmd): + '''execute shell command and print it out''' + def _exec_command_and_iter_show(cmd): + out = subprocess.Popen(cmd, shell = True, stdin = subprocess.PIPE, stdout = subprocess.PIPE, stderr = subprocess.PIPE, universal_newlines = True) + for stdout_line in iter(out.stdout.readline, ""): + yield stdout_line + return_code = out.wait() + if return_code: + raise subprocess.CalledProcessError(return_code, cmd) + for line in _exec_command_and_iter_show(cmd): + print line + + + def detect_cpu(self): + '''check which IA platform currently using''' + command_name = "lscpu | grep 'Model name' | awk -F ':' '{print $2}'" + model_string = self._exec_command(command_name) + self.model_string = model_string + #will make it configurable in the future + knl_pattern = re.compile(".*72[1359]0.*") + knm_pattern = re.compile(".*72.*") + skx_pattern = re.compile(".*[86543]1.*") + bdw_pattern = re.compile(".*(E5-[421]6|E7-[84]8|E3-12|D-?15).*") + if re.match(knl_pattern, model_string): + self.cpu_model = "knl" + elif re.match(knm_pattern, model_string): + self.cpu_model = "knm" + elif re.match(skx_pattern, model_string): + self.cpu_model = "skx" + elif re.match(bdw_pattern, model_string): + self.cpu_model = "bdw" + else: + self.unknown_cpu = True + logging.info("Can't detect which cpu model currently using, will use default settings, which may not be the optimal one.") + + def obtain_model_file(self, 
model): + '''change original model file batch size to bkm batch size''' + prototxt_file = "train_val_dummydata.prototxt" if self.dummy_data_use else "train_val.prototxt" + dst_model_file = "/".join([self.model_path, model, '-'.join([self.cpu_model, prototxt_file])]) + if os.path.isfile(dst_model_file): + os.remove(dst_model_file) + src_model_file = "/".join([self.model_path, model, prototxt_file]) + if not os.path.isfile(src_model_file): + logging.exception("template model file {} doesn't exist.".format(src_model_file)) + batch_size_pattern = re.compile(".*shape:.*") if self.dummy_data_use else re.compile(".*batch size:.*") + # we only care about train phase batch size for benchmarking + batch_size_cnt = 2 if self.dummy_data_use else 1 + if model not in self.bkm_batch_size or self.cpu_model not in self.bkm_batch_size[model]: + logging.exception("Can't find batch size of topology {} and cpu model {} within batch size table".format(model, self.cpu_model)) + new_batch_size = self.bkm_batch_size[model][self.cpu_model] + with open(src_model_file, 'r') as src_f, open(dst_model_file, 'w') as dst_f: + cnt = 0 + for line in src_f.readlines(): + if re.match(batch_size_pattern, line) and cnt < batch_size_cnt: + #change batch size + re.sub("[0-9]+", new_batch_size, line, count = 1) + cnt += 1 + dst_f.write(line) + return dst_model_file + + def obtain_solver_file(self, model): + '''obtain suitable solver file for training benchmark''' + solver_prototxt_file = "solver_dummydata.prototxt" if self.dummy_data_use else "solver.prototxt" + dst_solver_file = "/".join([self.model_path, model, '-'.join([self.cpu_model, solver_prototxt_file])]) + if os.path.isfile(dst_solver_file): + os.remove(dst_solver_file) + src_solver_file = "/".join([self.model_path, model, solver_prototxt_file]) + if not os.path.isfile(src_solver_file): + logging.exception("template solver file {} doesn't exist.".format(src_solver_file)) + dst_model_file = self.obtain_model_file(model) + max_iter = "200" + 
display_iter = "1" + net_path_pattern = re.compile(".*net:.*") + max_iter_pattern = re.compile(".*max_iter:.*") + display_pattern = re.compile(".*display:.*") + with open(src_solver_file, 'r') as src_f, open(dst_solver_file, 'w') as dst_f: + for line in src_f.readlines(): + if re.match(net_path_pattern, line): + dst_f.write('net: "{}"\n'.format(dst_model_file)) + elif re.match(max_iter_pattern, line): + dst_f.write('max_iter: {}\n'.format(max_iter)) + elif re.match(display_pattern, line): + dst_f.write('display: {}\n'.format(display_iter)) + else: + dst_f.write(line) + return dst_solver_file + + def run_specific_model(self, model): + '''run the topology you specified''' + self.calculate_numnodes() + if self.num_nodes == 1: + model_file = self.obtain_model_file(model) + exec_command = ' '.join([self.caffe_run_script, '--model_file', model_file, '--mode time', '--iteration', str(self.iterations), '--benchmark none']) + else: + solver_file = self.obtain_solver_file(model) + exec_command = ' '.join([self.caffe_run_script, '--hostfile', self.host_file, '--solver', solver_file, '--network', self.network, '--benchmark none']) + if self.network == "tcp": + exec_command += " --netmask {}".format(self.tcp_netmask) + + if self.engine != "": + exec_command += " --engine {}".format(self.engine) + if self.caffe_bin != "": + exec_command += " --caffe_bin {}".format(self.caffe_bin) + current_time = time.strftime("%Y%m%d%H%M%S") + if not self.unknown_cpu: + self.result_log_file = "-".join(["result", self.cpu_model, model, current_time + ".log"]) + else: + self.result_log_file = "-".join(["result", "unknown", model, current_time + ".log"]) + exec_command += " 2>&1 | tee {}".format(self.result_log_file) + self._exec_command_and_show(exec_command) + self.intelcaffe_log = self.obtain_intelcaffe_log() + self.calculate_fps() + + def obtain_intelcaffe_log(self): + '''obtain the logfile of 'run_intelcaffe' ''' + logging.info("Result log file: {}".format(self.result_log_file)) + if not 
os.path.isfile(self.result_log_file): + logging.exception("Couldn't see result log file {}".format(result_log_file)) + result_dir = '' + with open(self.result_log_file, 'r') as f: + for line in f.readlines(): + if line.startswith('Result folder:'): + result_dir = line.split('/')[-1].strip() + break + if result_dir == "": + logging.exception("Couldn't find result folder within file".format(result_file_log)) + if not self.unknown_cpu: + caffe_log_file = "-".join(["outputCluster", self.cpu_model, str(self.num_nodes) + '.txt']) + else: + caffe_log_file = "-".join(["outputCluster", "unknown", str(self.num_nodes) + '.txt']) + intelcaffe_log = "/".join([result_dir, caffe_log_file]) + logging.info('intelcaffe log: %s' % intelcaffe_log) + return intelcaffe_log + + def obtain_average_fwd_bwd_time(self): + '''obtain average iteration time of training''' + result_file = self.intelcaffe_log + if not os.path.isfile(result_file): + logging.exception("Error: result file {} does not exist...".format(result_file)) + if self.num_nodes == 1: + average_time = "" + with open(result_file, 'r') as f: + average_fwd_bwd_time_pattern = re.compile(".*Average Forward-Backward:.*") + for line in f.readlines(): + if re.match(average_fwd_bwd_time_pattern, line): + average_time = line.split()[-2] + if average_time == "": + logging.exception("Error: running intelcaffe failed, please check logs under: {}".format(result_file)) + average_time = float(average_time) + else: + start_iteration = 100 + iteration_num = 100 + total_time = 0.0 + delta_times = [] + with open(result_file, 'r') as f: + delta_time_pattern = re.compile(".*DELTA TIME.*") + for line in f.readlines(): + if re.match(delta_time_pattern, line): + delta_times.append(line.split()[-2]) + if len(delta_times) == 0: + logging.exception("Error: check if you mark 'CAFFE_PER_LAYER_TIMINGS := 1' while building caffe; also ensure you're running at least 200 iterations for multinode trainings; or check if you're running intelcaffe failed, the logs 
can be found under: {}".format(result_file)) + for delta_time in delta_times[start_iteration : start_iteration + iteration_num]: + total_time += float(delta_time) + average_time = total_time / iteration_num * 1000.0 + logging.info("average time: {} ms".format(str(average_time))) + return average_time + + def obtain_batch_size(self): + '''obtain global batch size for training''' + log_file = self.intelcaffe_log + if not os.path.isfile(log_file): + logging.exception("Error: log file {} does not exist...".format(log_file)) + with open(log_file, 'r') as f: + batch_size_pattern_time = re.compile(".*SetMinibatchSize.*") + batch_size_pattern_dummy = re.compile(".*dim:.*") + batch_size_pattern_real = re.compile(".*batch_size:.*") + batch_size = '' + for line in f.readlines(): + if re.match(batch_size_pattern_time, line) or re.match(batch_size_pattern_real, line) or re.match(batch_size_pattern_dummy, line): + batch_size = line.split()[-1] + break + if batch_size == '': + logging.exception("Can't find batch size within your log file: {}".format(log_file)) + batch_size = int(batch_size) * self.num_nodes + logging.info("global batch size: {}".format(str(batch_size))) + return float(batch_size) + + def calculate_fps(self): + '''calculate fps here''' + self.batch_size = self.obtain_batch_size() + self.average_time = self.obtain_average_fwd_bwd_time() + speed = self.batch_size * 1000.0 / self.average_time + self.speed = int(speed) + logging.info("benchmark speed: {} images/sec".format(str(self.speed))) + return speed + + def get_local_ip_lists(self): + '''get local ip lists''' + exec_command = 'ip addr' + out = self._exec_command(exec_command) + ip_pattern = re.compile(".*inet [0-9]+.*") + self.local_ips = [] + for line in out.split('\n'): + if re.match(ip_pattern, line): + ip = line.split()[1].split('/')[0] + self.local_ips.append(ip) + if len(self.local_ips) == 0: + logging.exception("Can't find available ips on local node.") + hostname = socket.gethostname() + 
self.local_ips.append(hostname) + + def manipulate_host_file(self): + '''put master node ip or hostname on the first one of the host ip or hostname list''' + self.get_local_ip_lists() + self.hosts = [] + with open(self.host_file, 'r') as origin_f: + for line in origin_f.readlines(): + self.hosts.append(line.rstrip().lstrip()) + for index, ip in enumerate(self.hosts): + if ip in self.local_ips: + self.hosts[0], self.hosts[index] = self.hosts[index], self.hosts[0] + break + + + def obtain_host_file(self, num_nodes): + '''obtain suitable host file to do scaling test''' + dst_host_file = 'scal_hostfile' + with open(dst_host_file, 'w') as dst_f: + for i in xrange(num_nodes): + dst_f.write(self.hosts[i] + '\n') + return dst_host_file + + def run_scal_test(self, model): + '''scaling test on multinodes''' + num_nodes = self.calculate_numnodes() + if num_nodes <= 1 or ((num_nodes & (num_nodes - 1))) != 0: + logging.exception("nodes number: {} is not a power of 2.".format(num_nodes)) + self.manipulate_host_file() + origin_hostfile = self.host_file + fps_table = {} + while num_nodes > 0: + self.host_file = self.obtain_host_file(num_nodes) + self.run_specific_model(model) + fps_table[num_nodes] = self.speed + num_nodes /= 2 + # roll back actual num_nodes for possible topology 'all' + os.remove(self.host_file) + self.host_file = origin_hostfile + self.print_scal_test_results(fps_table) + + def print_scal_test_results(self, fps_table): + '''print scaling test results out''' + logging.info('') + logging.info('-------scaling test results----------') + logging.info('num_nodes, fps(images/s), scaling efficiency') + num_nodes, total_num_nodes = 1, self.calculate_numnodes() + while num_nodes <= total_num_nodes: + scal_efficiency = round(float(fps_table[num_nodes]) / float((num_nodes * fps_table[1])), 3) + logging.info('{}, {}, {}'.format(str(num_nodes), str(fps_table[num_nodes]), str(scal_efficiency))) + num_nodes *= 2 + logging.info('') + + def run_benchmark(self): + '''run 
intelcaffe training benchmark''' + self.detect_cpu() + logging.info("Cpu model: {}".format(self.model_string)) + if self.topology == 'all': + for model in topology_list: + if model == 'all': + continue + logging.info("--{}".format(model)) + if self.scal_test: + self.run_scal_test(model) + else: + self.run_specific_model(model) + else: + if self.scal_test: + self.run_scal_test(self.topology) + else: + self.run_specific_model(self.topology) + + def check_parameters(self): + '''check program parameters''' + if self.topology == "": + logging.exception("Error: topology is not specified.") + self.is_supported_topology() + if self.host_file != "": + if self.network == "tcp" and self.tcp_netmask == "": + logging.exception("Error: need to specify tcp network's netmask") + +def main(): + '''main routine''' + arg_parser = argparse.ArgumentParser(description = "Used to run intelcaffe training benchmark") + arg_parser.add_argument('--configfile', help = "config file which contains the parameters you want and the batch size you want to use on all topologies and platforms") + main_args = arg_parser.parse_args() + if main_args.configfile == '' or not os.path.isfile(main_args.configfile): + logging.exception("Cant't find config file {}.".format(main_args.configfile)) + with open(main_args.configfile, 'r') as f: + config = json.load(f) + topology = config['params']['topology'] + host_file = config['params']['hostfile'] + network = config['params']['network'] + tcp_netmask = config['params']['netmask'] + engine = config['params']["engine"] + dummy_data_use = config['params']['dummy_data_use'] + scal_test = config['params']['scal_test'] + caffe_bin = config['params']['caffe_bin'] + bkm_batch_size = config['batch_size_table'] + + caffe_benchmark = CaffeBenchmark(topology, bkm_batch_size, host_file, network, tcp_netmask, engine, dummy_data_use, caffe_bin, scal_test) + caffe_benchmark.run_benchmark() + +if __name__ == "__main__": + main() From d2b4ec5cb12aa0e468b414522bc2f1e8abb246d2 Mon 
Sep 17 00:00:00 2001 From: xiaolil1 Date: Wed, 3 Jan 2018 06:51:22 +0800 Subject: [PATCH 35/53] Merge int8 implementation from 'prv-inf' branch --- include/caffe/layers/mkldnn_layers.hpp | 45 +- include/caffe/mkldnn_base.hpp | 5 +- include/caffe/mkldnn_memory.hpp | 92 +- include/caffe/net.hpp | 19 +- include/caffe/quant/base_quant_layer.hpp | 62 + include/caffe/quant/quantization.hpp | 136 + .../int8/inceptionv3_int8.prototxt | 4568 +++++++++++++++++ .../int8/resnet50_int8.prototxt | 3056 +++++++++++ .../int8/ssd_int8.prototxt | 1864 +++++++ src/caffe/layers/mkldnn_concat_layer.cpp | 70 +- src/caffe/layers/mkldnn_convolution_layer.cpp | 187 +- src/caffe/layers/mkldnn_eltwise_layer.cpp | 8 - .../layers/mkldnn_inner_product_layer.cpp | 2 +- src/caffe/layers/mkldnn_lrn_layer.cpp | 35 +- src/caffe/layers/mkldnn_pooling_layer.cpp | 24 +- src/caffe/mkldnn_base.cpp | 33 + src/caffe/mkldnn_memory.cpp | 272 +- src/caffe/net.cpp | 101 +- src/caffe/proto/caffe.proto | 23 +- src/caffe/quant/layers/base_quant_layer.cpp | 56 + src/caffe/quant/quantization.cpp | 331 ++ tools/caffe.cpp | 3 + tools/sample.cpp | 154 + 23 files changed, 11015 insertions(+), 131 deletions(-) create mode 100644 include/caffe/quant/base_quant_layer.hpp create mode 100644 include/caffe/quant/quantization.hpp create mode 100644 models/intel_optimized_models/int8/inceptionv3_int8.prototxt create mode 100644 models/intel_optimized_models/int8/resnet50_int8.prototxt create mode 100644 models/intel_optimized_models/int8/ssd_int8.prototxt create mode 100644 src/caffe/quant/layers/base_quant_layer.cpp create mode 100644 src/caffe/quant/quantization.cpp create mode 100644 tools/sample.cpp diff --git a/include/caffe/layers/mkldnn_layers.hpp b/include/caffe/layers/mkldnn_layers.hpp index cde342b30..b32fa0a03 100644 --- a/include/caffe/layers/mkldnn_layers.hpp +++ b/include/caffe/layers/mkldnn_layers.hpp @@ -59,12 +59,39 @@ using namespace mkldnn; namespace caffe { +// ===== Log functions 
============================================== +template +inline void info_mem_pd(shared_ptr mem_pd, string name) { + // format of mem_pda +//#ifdef DEBUG + LOG(INFO) << name; + + switch (mem_pd->desc().data.format) { + case memory::format::nchw: LOG(INFO) << "format: nchw"; break; + case memory::format::nhwc: LOG(INFO) << "format: nhwc"; break; + case memory::format::nChw8c: LOG(INFO) << "format: nChw8c"; break; + case memory::format::nChw16c: LOG(INFO) << "format: nChw16c"; break; + case memory::format::nc: LOG(INFO) << "format: nc"; break; + default: assert(!"Error format"); + } + // data_type + switch (mem_pd->desc().data.data_type) { + case memory::data_type::f32: LOG(INFO) << "data_type: f32"; break; + case memory::data_type::u8: LOG(INFO) << "data_type: u8"; break; + case memory::data_type::s8: LOG(INFO) << "data_type: s8"; break; + case memory::data_type::s32: LOG(INFO) << "data_type: s32"; break; + default: assert(!"Error data_type"); + } +//#endif +} + + // ===== MKLDNNBatchNormLayer ======================================= template class MKLDNNBatchNormLayer : public MKLDNNLayer, public Layer { public: explicit MKLDNNBatchNormLayer(const LayerParameter& param) - : Layer(param) + : MKLDNNLayer(param), Layer(param) , fwd_top_data(), fwd_bottom_data() , bwd_top_diff(), bwd_bottom_diff() , BatchNormFwd_pd(), BatchNormBwd_pd() @@ -270,6 +297,12 @@ class MKLDNNLRNLayer : public MKLDNNLayer , public Layer { MKLDNNPrimitive lrnFwd; MKLDNNPrimitive lrnBwd; shared_ptr bottom_md; + + int fl; + float scale; + shared_ptr buffer; + MKLDNNPrimitive lrn_reorder; + shared_ptr fwd_top_data_memory, bwd_bottom_diff_memory, scratch_memory; shared_ptr fwd_bottom_data_primitive, bwd_top_diff_primitive; Dtype alpha_, beta_, k_; @@ -284,7 +317,7 @@ template class MKLDNNPoolingLayer : public MKLDNNLayer, public Layer { public: explicit MKLDNNPoolingLayer(const LayerParameter& param) - : MKLDNNLayer(), Layer(param) + : MKLDNNLayer(param), Layer(param) , fwd_bottom_data(), 
fwd_top_data() , bwd_top_diff(), bwd_bottom_diff() , poolingFwd_pd() @@ -359,7 +392,7 @@ class MKLDNNReLULayer : public MKLDNNLayer , public NeuronLayer { * the value @f$ \nu @f$ by which negative values are multiplied. */ explicit MKLDNNReLULayer(const LayerParameter& param) - : MKLDNNLayer(), NeuronLayer(param) + : MKLDNNLayer(param), NeuronLayer(param) , fwd_top_data(), fwd_bottom_data() , bwd_top_diff(), bwd_bottom_diff() , reluFwd_pd(), reluBwd_pd() @@ -405,7 +438,7 @@ template class MKLDNNConcatLayer : public MKLDNNLayer , public Layer { public: explicit MKLDNNConcatLayer(const LayerParameter& param) - : MKLDNNLayer(), Layer(param), + : MKLDNNLayer(param), Layer(param), concatFwd_pd(), fwd_output_memory(), bwd_reorder_input_memory(), bwd_reorder_output_memory(), fwd_top_data(), fwd_bottom_data(), split_dims() { @@ -454,7 +487,7 @@ template class MKLDNNSplitLayer : public MKLDNNLayer , public Layer { public: explicit MKLDNNSplitLayer(const LayerParameter& param) - : MKLDNNLayer(), Layer(param), + : MKLDNNLayer(param), Layer(param), splitBwd_pd_(), bwd_bottom_diff_memory_() { PERFORMANCE_EVENT_ID_RESET(perf_id_bw_); @@ -494,7 +527,7 @@ template class MKLDNNEltwiseLayer : public MKLDNNLayer , public Layer { public: explicit MKLDNNEltwiseLayer(const LayerParameter& param) - : MKLDNNLayer(), Layer(param) + : MKLDNNLayer(param), Layer(param) , fwd_top_data(), fwd_bottom_data() , eltwiseFwd_pd() , fwd_top_data_memory() diff --git a/include/caffe/mkldnn_base.hpp b/include/caffe/mkldnn_base.hpp index 6e7c11b29..dc726c73d 100644 --- a/include/caffe/mkldnn_base.hpp +++ b/include/caffe/mkldnn_base.hpp @@ -46,6 +46,7 @@ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
#include "caffe/common.hpp" #include "caffe/util/math_functions.hpp" #include "mkldnn.hpp" +#include "caffe/quant/base_quant_layer.hpp" using namespace mkldnn; @@ -192,9 +193,9 @@ class StreamHolder // ===== MKLDNNLayer ======================================= template -class MKLDNNLayer { +class MKLDNNLayer : public BaseQuantLayer { public: - explicit MKLDNNLayer() {} + explicit MKLDNNLayer(const LayerParameter ¶m); virtual ~MKLDNNLayer() {} protected: bool reshape; diff --git a/include/caffe/mkldnn_memory.hpp b/include/caffe/mkldnn_memory.hpp index 597ab95df..850028ff5 100644 --- a/include/caffe/mkldnn_memory.hpp +++ b/include/caffe/mkldnn_memory.hpp @@ -60,7 +60,17 @@ class MKLDNNMemoryDescriptorBase : public PrvMemDescr public: MKLDNNMemoryDescriptorBase(shared_ptr usr_memory_pd , shared_ptr prv_memory_pd - , Blob* blob, MKLDNNLayer* mkldnn_layer); + , Blob* blob, MKLDNNLayer* mkldnn_layer + , std::vectorfl=std::vector(1,0) + , bool is_sum=false); + + MKLDNNMemoryDescriptorBase(shared_ptr usr_memory_pd + , shared_ptr prv_memory_pd + , Blob* blob, MKLDNNLayer* mkldnn_layer + , bool is_float + , std::vectorscale=std::vector(1,1.) 
+ , bool is_sum=false); + ~MKLDNNMemoryDescriptorBase() {} // ---- PrvMemDescr virtual functions ----- @@ -99,6 +109,20 @@ class MKLDNNMemoryDescriptorBase : public PrvMemDescr shared_ptr reorder_prv2usr() { return _reorder_prv2usr.aprimitive; } shared_ptr reorder_extprv2prv() { return _reorder_extprv2prv.aprimitive; } + float get_scale(int i) { return _scale[i]; } + std::vector get_scale() { return _scale; } + void set_scale(std::vector scale) { _scale.assign(scale.begin(),scale.end());} + + int get_fl(int i) { return _fl[i]; } + std::vector get_fl() { return _fl; } + void set_fl(std::vector fl) { _fl.assign(fl.begin(),fl.end());} + + void set_sum(bool is_sum) { _is_sum = is_sum; } + bool get_sum() { return _is_sum; } + + void set_float(bool is_float) { _is_float = is_float; } + bool get_float() { return _is_float; } + void set_mkldnn_layer(MKLDNNLayer* layer) { _mkldnn_layer = layer; } MKLDNNLayer* mkldnn_layer() const { return _mkldnn_layer; } @@ -130,28 +154,49 @@ class MKLDNNMemoryDescriptorBase : public PrvMemDescr // TODO: may need initialize memory by 0 } } - void set_prv_memory_pd(shared_ptr memory_pd) { + void set_prv_memory_pd(shared_ptr memory_pd, std::vector scale) { _prv_memory_pd = memory_pd; if (_prv_memory_pd && _usr_memory_pd) { check_usr_with_prv_descriptors(); - this->create_reorder_descriptors(); + this->create_reorder_descriptors(scale); } } - void set_extprv_memory_pd(shared_ptr memory_pd) { + + void set_prv_memory_pd(shared_ptr memory_pd, std::vector fl) { + _prv_memory_pd = memory_pd; + if (_prv_memory_pd && _usr_memory_pd) { + check_usr_with_prv_descriptors(); + this->create_reorder_descriptors(fl); + } + } + + void set_extprv_memory_pd(shared_ptr memory_pd, std::vector fl, std::vector fl_ext, bool is_sum) { _extprv_memory_pd = memory_pd; if (_prv_memory_pd && _usr_memory_pd) { check_usr_with_prv_descriptors(); - this->create_reorder_descriptors(); + this->create_reorder_descriptors(fl, fl_ext, is_sum); } } - void 
set_usr_memory_pd(shared_ptr memory_pd) { - _usr_memory_pd = memory_pd; + + void set_extprv_memory_pd(shared_ptr memory_pd, std::vector scale, std::vector scale_ext, bool is_sum) { + _extprv_memory_pd = memory_pd; if (_prv_memory_pd && _usr_memory_pd) { check_usr_with_prv_descriptors(); - this->create_reorder_descriptors(); + this->create_reorder_descriptors(scale, scale_ext, is_sum); } } - void create_reorder_descriptors(); + + void set_usr_memory_pd(shared_ptr memory_pd, std::vector scale) { + _usr_memory_pd = memory_pd; + } + + void set_usr_memory_pd(shared_ptr memory_pd, std::vector fl) { + _usr_memory_pd = memory_pd; + } + + void create_reorder_descriptors(std::vector scale, std::vectorscale_ext=std::vector(1,1.), bool is_sum=false); + + void create_reorder_descriptors(std::vector fl, std::vectorfl_ext=std::vector(1,0), bool is_sum=false); shared_ptr _usr_memory_pd; shared_ptr _prv_memory_pd; @@ -169,6 +214,10 @@ class MKLDNNMemoryDescriptorBase : public PrvMemDescr MKLDNNLayer* _mkldnn_layer; Blob* _blob; + std::vector _scale = std::vector(1,1.); + std::vector _fl = std::vector(1,0); + bool _is_sum = false; + bool _is_float = false; #ifdef USE_MLSL shared_ptr _mlsl_memory; #endif @@ -179,7 +228,16 @@ class MKLDNNMemoryDescriptor : public MKLDNNMemoryDescriptorBase { public: MKLDNNMemoryDescriptor(shared_ptr usr_memory_pd , shared_ptr prv_memory_pd - , Blob* blob, MKLDNNLayer* mkldnn_layer); + , Blob* blob, MKLDNNLayer* mkldnn_layer + , std::vector fl=std::vector(1,0) + , bool is_sum=false); + + MKLDNNMemoryDescriptor(shared_ptr usr_memory_pd + , shared_ptr prv_memory_pd + , Blob* blob, MKLDNNLayer* mkldnn_layer + , bool is_float + , std::vector scale=std::vector(1,1.) 
+ , bool is_sum=false); virtual void convert_from_prv(void* cpu_ptr); virtual void convert_to_prv(void* cpu_ptr); @@ -218,8 +276,18 @@ class MKLDNNData : public MKLDNNMemoryDescriptor public: MKLDNNData(shared_ptr usr_memory_pd , shared_ptr prv_memory_pd - , Blob* blob, MKLDNNLayer* mkldnn_layer) - : MKLDNNMemoryDescriptor(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer) {} + , Blob* blob, MKLDNNLayer* mkldnn_layer + , std::vector fl=std::vector(1,0) + , bool is_sum=false) + : MKLDNNMemoryDescriptor(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer, fl, is_sum) {} + + MKLDNNData(shared_ptr usr_memory_pd + , shared_ptr prv_memory_pd + , Blob* blob, MKLDNNLayer* mkldnn_layer + , bool is_float + , std::vector scale=std::vector(1,1.) + , bool is_sum=false) + : MKLDNNMemoryDescriptor(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer, is_float, scale, is_sum) {} }; template diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index 3359ac813..f27f24473 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -312,7 +312,6 @@ class Net { */ static void CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled); - /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. @@ -339,6 +338,24 @@ class Net { /// @brief return whether NetState state meets NetStateRule rule static bool StateMeetsRule(const NetState& state, const NetStateRule& rule, const string& layer_name); + /** + * @brief Look at the layer activations and parameters to find the maximum + * absolute values. The following layers are considered: Convolution, + * InnerProduct. + * + * @param layer_name The layers that should be quantized to fixed point. + * @param max_in The highest layer input. + * @param max_out The highest layer output. + * @param max_param The highest layer parameter. + * + * For layer parameters, the biases are ignored. 
+ */ + void RangeInLayers(vector* layer_name, vector* max_in, + vector* max_out, vector>* max_param, string scaling); + /** + * @brief Find the maximum value in a blob. + */ + vector FindMax(Blob* blob, bool is_single=true); inline const map& blob_names_index() const { return blob_names_index_; } diff --git a/include/caffe/quant/base_quant_layer.hpp b/include/caffe/quant/base_quant_layer.hpp new file mode 100644 index 000000000..c048ca33b --- /dev/null +++ b/include/caffe/quant/base_quant_layer.hpp @@ -0,0 +1,62 @@ +/* +All modification made by Intel Corporation: © 2016 Intel Corporation + +All contributions by the University of California: +Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +All rights reserved. + +All other contributions: +Copyright (c) 2014, 2015, the respective contributors +All rights reserved. +For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md + +A part of the code referenced BVLC CAFFE ristretto branch +For the original code go to https://github.com/pmgysel/caffe + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + * Neither the name of Intel Corporation nor the names of its contributors + may be used to endorse or promote products derived from this software + without specific prior written permission. 
+ +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ + +#ifndef CAFFE_BASE_QUANT_LAYER_HPP_ +#define CAFFE_BASE_QUANT_LAYER_HPP_ + +#include "caffe/proto/caffe.pb.h" + +namespace caffe { + +template +class BaseQuantLayer{ + public: + explicit BaseQuantLayer(); + protected: + int bw_params_, bw_layer_in_, bw_layer_out_; + vector fl_params_, fl_layer_in_, fl_layer_out_; + vector scale_params_, scale_in_, scale_out_; + int rounding_, precision_; + bool need_quantize_; + bool is_float_; +}; + +} // namespace caffe + +#endif // CAFFE_BASE_QUANT_LAYER_HPP_ diff --git a/include/caffe/quant/quantization.hpp b/include/caffe/quant/quantization.hpp new file mode 100644 index 000000000..2fc856830 --- /dev/null +++ b/include/caffe/quant/quantization.hpp @@ -0,0 +1,136 @@ +/* +All modification made by Intel Corporation: © 2016 Intel Corporation + +All contributions by the University of California: +Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +All rights reserved. + +All other contributions: +Copyright (c) 2014, 2015, the respective contributors +All rights reserved. 
+For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md + +A part of the code referenced BVLC CAFFE ristretto branch +For the original code go to https://github.com/pmgysel/caffe + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + * Neither the name of Intel Corporation nor the names of its contributors + may be used to endorse or promote products derived from this software + without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ + +#ifndef QUANTIZATION_HPP_ +#define QUANTIZATION_HPP_ + +#include "caffe/caffe.hpp" + +using caffe::string; +using caffe::vector; +using caffe::Net; + +/** + * @brief Approximate 32-bit floating point networks. + * + * This is the Ristretto tool. 
Use it to generate file descriptions of networks + * which use reduced word width arithmetic. + */ +class Quantization { +public: + explicit Quantization(string model, string weights, string model_quantized, + int iterations, string trimming_mode, double error_margin, int score_number, string scaling="single", int detection=0, int power=1); + void QuantizeNet(); +private: + void CheckWritePermissions(const string path); + /** + * @brief Score network. + * @param accuracy Reports the network's accuracy according to + * accuracy_number. + * @param do_stats: Find the maximal values in each layer. + * @param score_number The accuracy layer that matters. + * + * For networks with multiple accuracy layers, set score_number to the + * appropriate value. For example, for BVLC GoogLeNet, use score_number=7. + */ + void RunForwardBatches(const int iterations, Net* caffe_net, + float* accuracy, const bool do_stats = false, const int score_number = 0); // 7 for GoogleNet-V1 + /** + * @brief Quantize convolutional and fully connected layers to dynamic fixed + * point. + * The parameters and layer activations get quantized and the resulting + * network will be tested. + * Find the required number of bits required for parameters and layer + * activations (which might differ from each other). + */ + void Quantize2DynamicFixedPoint(); + + /** + * @brief Change network to dynamic fixed point. + */ + void EditNetDescriptionDynamicFixedPoint(caffe::NetParameter* param, + const string layer_quantize, const string network_part, + const int bw_conv, const int bw_in, const int bw_out); + + vector GetIntegerLengthParams(const string layer_name); + vector GetScaleParams(const string layer_name); + /** + * @brief Find the integer length for dynamic fixed point inputs of a certain + * layer. + */ + int GetIntegerLengthIn(const string layer_name); + float GetScaleIn(const string layer_name); + /** + * @brief Find the integer length for dynamic fixed point outputs of a certain + * layer. 
+ */ + int GetIntegerLengthOut(const string layer_name); + float GetScaleOut(const string layer_name); + + string model_; + string weights_; + string model_quantized_; + int iterations_; + string trimming_mode_; + double error_margin_; + int score_number; + string scaling; + int detection; + int power; + float test_score_baseline_; + // The maximal absolute values of layer inputs, parameters and + // layer outputs. + vector max_in_, max_out_; + vector> max_params_; + + // The integer bits for dynamic fixed point layer inputs, parameters and + // layer outputs. + vector il_in_, il_out_; + vector> il_params_; + + vector scale_in_, scale_out_; + vector> scale_params_; + // The name of the layers that need to be quantized to dynamic fixed point. + vector layer_names_; + // The number of bits used for dynamic fixed point layer inputs, parameters + // and layer outputs. + int bw_in_, bw_conv_params_, bw_fc_params_, bw_out_; +}; + +#endif // QUANTIZATION_HPP_ diff --git a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt new file mode 100644 index 000000000..ed0cbf632 --- /dev/null +++ b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt @@ -0,0 +1,4568 @@ +name: "InceptionV3" +layer { + name: "data" + type: "DummyData" + top: "data" + dummy_data_param { + data_filler { + type: "constant" + value: 0.0099999997764825821 + } + shape { + dim: 64 + dim: 3 + dim: 299 + dim: 299 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + dummy_data_param { + data_filler { + type: "constant" + } + shape { + dim: 64 + } + } +} +layer { + name: "conv_conv2d" + type: "Convolution" + bottom: "data" + top: "conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 32 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + } +} +layer { + name: "conv_batchnorm" + type: "BatchNorm" + bottom: 
"conv_conv2d" + top: "conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "conv_relu" + type: "ReLU" + bottom: "conv_conv2d_bn" + top: "conv_conv2d_relu" +} +layer { + name: "conv_1_1_conv2d" + type: "Convolution" + bottom: "conv_conv2d_relu" + top: "conv_1_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 32 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 5 + fl_params: 6 + } +} +layer { + name: "conv_1_1_batchnorm" + type: "BatchNorm" + bottom: "conv_1_1_conv2d" + top: "conv_1_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "conv_1_1_relu" + type: "ReLU" + bottom: "conv_1_1_conv2d_bn" + top: "conv_1_1_conv2d_relu" +} +layer { + name: "conv_2_2_conv2d" + type: "Convolution" + bottom: "conv_1_1_conv2d_relu" + top: "conv_2_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 5 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "conv_2_2_batchnorm" + type: "BatchNorm" + bottom: "conv_2_2_conv2d" + top: "conv_2_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "conv_2_2_relu" + type: "ReLU" + bottom: "conv_2_2_conv2d_bn" + top: "conv_2_2_conv2d_relu" +} +layer { + name: "pool" + type: "Pooling" + bottom: "conv_2_2_conv2d_relu" + top: "pool" + pooling_param { + pool: MAX + pad: 0 + kernel_size: 3 + stride: 2 + } +} +layer { + name: "conv_3_3_conv2d" + type: "Convolution" + bottom: "pool" + top: "conv_3_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 80 + bias_term: false + pad: 0 + 
kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 6 + } +} +layer { + name: "conv_3_3_batchnorm" + type: "BatchNorm" + bottom: "conv_3_3_conv2d" + top: "conv_3_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "conv_3_3_relu" + type: "ReLU" + bottom: "conv_3_3_conv2d_bn" + top: "conv_3_3_conv2d_relu" +} +layer { + name: "conv_4_4_conv2d" + type: "Convolution" + bottom: "conv_3_3_conv2d_relu" + top: "conv_4_4_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 32 #FIXME 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 16 #FIXME 6 + fl_params: 8 + } +} +layer { + name: "conv_4_4_batchnorm" + type: "BatchNorm" + bottom: "conv_4_4_conv2d" + top: "conv_4_4_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "conv_4_4_relu" + type: "ReLU" + bottom: "conv_4_4_conv2d_bn" + top: "conv_4_4_conv2d_relu" +} +layer { + name: "pool1" + type: "Pooling" + bottom: "conv_4_4_conv2d_relu" + top: "pool1" + pooling_param { + pool: MAX + pad: 0 + kernel_size: 3 + stride: 2 + } +} +layer { + name: "mixed_conv_conv2d" + type: "Convolution" + bottom: "pool1" + top: "mixed_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_conv_conv2d" + top: "mixed_conv_conv2d_bn" 
+ batch_norm_param { + } +} +layer { + name: "mixed_conv_relu" + type: "ReLU" + bottom: "mixed_conv_conv2d_bn" + top: "mixed_conv_conv2d_relu" +} +layer { + name: "mixed_tower_conv_conv2d" + type: "Convolution" + bottom: "pool1" + top: "mixed_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 48 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_conv_conv2d" + top: "mixed_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_conv_relu" + type: "ReLU" + bottom: "mixed_tower_conv_conv2d_bn" + top: "mixed_tower_conv_conv2d_relu" +} +layer { + name: "mixed_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_tower_conv_conv2d_relu" + top: "mixed_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 2 + kernel_size: 5 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_conv_1_conv2d" + top: "mixed_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_tower_conv_1_conv2d_bn" + top: "mixed_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_tower_1_conv_conv2d" + type: "Convolution" + bottom: "pool1" + top: "mixed_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + 
weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_1_conv_conv2d" + top: "mixed_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_tower_1_conv_conv2d_bn" + top: "mixed_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_tower_1_conv_conv2d_relu" + top: "mixed_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_1_conv_1_conv2d" + top: "mixed_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_tower_1_conv_1_conv2d_bn" + top: "mixed_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_tower_1_conv_1_conv2d_relu" + top: "mixed_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 8 + } +} +layer { + name: "mixed_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_1_conv_2_conv2d" + top: 
"mixed_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_tower_1_conv_2_conv2d_bn" + top: "mixed_tower_1_conv_2_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_pool" + type: "Pooling" + bottom: "pool1" + top: "AVE_pool_mixed_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_pool" + top: "mixed_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 32 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_tower_2_conv_conv2d" + top: "mixed_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_tower_2_conv_conv2d_bn" + top: "mixed_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_chconcat" + type: "Concat" + bottom: "mixed_conv_conv2d_relu" + bottom: "mixed_tower_conv_1_conv2d_relu" + bottom: "mixed_tower_1_conv_2_conv2d_relu" + bottom: "mixed_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_chconcat" + top: "mixed_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: 
"mixed_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_conv_conv2d" + top: "mixed_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_conv_relu" + type: "ReLU" + bottom: "mixed_1_conv_conv2d_bn" + top: "mixed_1_conv_conv2d_relu" +} +layer { + name: "mixed_1_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_chconcat" + top: "mixed_1_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 48 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_1_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_conv_conv2d" + top: "mixed_1_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_conv_relu" + type: "ReLU" + bottom: "mixed_1_tower_conv_conv2d_bn" + top: "mixed_1_tower_conv_conv2d_relu" +} +layer { + name: "mixed_1_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_1_tower_conv_conv2d_relu" + top: "mixed_1_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 2 + kernel_size: 5 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 9 + } +} +layer { + name: "mixed_1_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_conv_1_conv2d" + top: "mixed_1_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_1_tower_conv_1_conv2d_bn" + top: "mixed_1_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_1_tower_1_conv_conv2d" + type: "Convolution" + bottom: 
"ch_concat_mixed_chconcat" + top: "mixed_1_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_1_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_1_conv_conv2d" + top: "mixed_1_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_1_tower_1_conv_conv2d_bn" + top: "mixed_1_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_1_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_1_tower_1_conv_conv2d_relu" + top: "mixed_1_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_1_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_1_conv_1_conv2d" + top: "mixed_1_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_1_tower_1_conv_1_conv2d_bn" + top: "mixed_1_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_1_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_1_tower_1_conv_1_conv2d_relu" + top: "mixed_1_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: 
DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 6 + } +} +layer { + name: "mixed_1_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_1_conv_2_conv2d" + top: "mixed_1_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_1_tower_1_conv_2_conv2d_bn" + top: "mixed_1_tower_1_conv_2_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_1_pool" + type: "Pooling" + bottom: "ch_concat_mixed_chconcat" + top: "AVE_pool_mixed_1_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_1_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_1_pool" + top: "mixed_1_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_1_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_1_tower_2_conv_conv2d" + top: "mixed_1_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_1_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_1_tower_2_conv_conv2d_bn" + top: "mixed_1_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_1_chconcat" + type: "Concat" + bottom: "mixed_1_conv_conv2d_relu" + bottom: "mixed_1_tower_conv_1_conv2d_relu" + bottom: "mixed_1_tower_1_conv_2_conv2d_relu" + bottom: "mixed_1_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_1_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_2_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_1_chconcat" + top: "mixed_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + 
num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_conv_conv2d" + top: "mixed_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_conv_relu" + type: "ReLU" + bottom: "mixed_2_conv_conv2d_bn" + top: "mixed_2_conv_conv2d_relu" +} +layer { + name: "mixed_2_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_1_chconcat" + top: "mixed_2_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 48 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_2_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_tower_conv_conv2d" + top: "mixed_2_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_conv_relu" + type: "ReLU" + bottom: "mixed_2_tower_conv_conv2d_bn" + top: "mixed_2_tower_conv_conv2d_relu" +} +layer { + name: "mixed_2_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_2_tower_conv_conv2d_relu" + top: "mixed_2_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 2 + kernel_size: 5 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 9 + } +} +layer { + name: "mixed_2_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: 
"mixed_2_tower_conv_1_conv2d" + top: "mixed_2_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_2_tower_conv_1_conv2d_bn" + top: "mixed_2_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_2_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_1_chconcat" + top: "mixed_2_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_2_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_tower_1_conv_conv2d" + top: "mixed_2_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_2_tower_1_conv_conv2d_bn" + top: "mixed_2_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_2_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_2_tower_1_conv_conv2d_relu" + top: "mixed_2_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_2_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_tower_1_conv_1_conv2d" + top: "mixed_2_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_2_tower_1_conv_1_conv2d_bn" + top: "mixed_2_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_2_tower_1_conv_2_conv2d" + type: "Convolution" 
+ bottom: "mixed_2_tower_1_conv_1_conv2d_relu" + top: "mixed_2_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_2_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_tower_1_conv_2_conv2d" + top: "mixed_2_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_2_tower_1_conv_2_conv2d_bn" + top: "mixed_2_tower_1_conv_2_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_2_pool" + type: "Pooling" + bottom: "ch_concat_mixed_1_chconcat" + top: "AVE_pool_mixed_2_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_2_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_2_pool" + top: "mixed_2_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_2_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_2_tower_2_conv_conv2d" + top: "mixed_2_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_2_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_2_tower_2_conv_conv2d_bn" + top: "mixed_2_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_2_chconcat" + type: "Concat" + bottom: "mixed_2_conv_conv2d_relu" + bottom: "mixed_2_tower_conv_1_conv2d_relu" + bottom: 
"mixed_2_tower_1_conv_2_conv2d_relu" + bottom: "mixed_2_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_2_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_3_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_2_chconcat" + top: "mixed_3_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_3_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_3_conv_conv2d" + top: "mixed_3_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_3_conv_relu" + type: "ReLU" + bottom: "mixed_3_conv_conv2d_bn" + top: "mixed_3_conv_conv2d_relu" +} +layer { + name: "mixed_3_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_2_chconcat" + top: "mixed_3_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_3_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_3_tower_conv_conv2d" + top: "mixed_3_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_3_tower_conv_relu" + type: "ReLU" + bottom: "mixed_3_tower_conv_conv2d_bn" + top: "mixed_3_tower_conv_conv2d_relu" +} +layer { + name: "mixed_3_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_3_tower_conv_conv2d_relu" + top: "mixed_3_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 1 + 
kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 8 + fl_params: 8 + } +} +layer { + name: "mixed_3_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_3_tower_conv_1_conv2d" + top: "mixed_3_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_3_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_3_tower_conv_1_conv2d_bn" + top: "mixed_3_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_3_tower_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_3_tower_conv_1_conv2d_relu" + top: "mixed_3_tower_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 96 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 8 + fl_layer_out: 6 + fl_params: 8 + } +} +layer { + name: "mixed_3_tower_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_3_tower_conv_2_conv2d" + top: "mixed_3_tower_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_3_tower_conv_2_relu" + type: "ReLU" + bottom: "mixed_3_tower_conv_2_conv2d_bn" + top: "mixed_3_tower_conv_2_conv2d_relu" +} +layer { + name: "max_pool_mixed_3_pool" + type: "Pooling" + bottom: "ch_concat_mixed_2_chconcat" + top: "max_pool_mixed_3_pool" + pooling_param { + pool: MAX + pad: 0 + kernel_size: 3 + stride: 2 + } +} +layer { + name: "ch_concat_mixed_3_chconcat" + type: "Concat" + bottom: "max_pool_mixed_3_pool" + bottom: "mixed_3_conv_conv2d_relu" + bottom: "mixed_3_tower_conv_2_conv2d_relu" + top: "ch_concat_mixed_3_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_4_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_3_chconcat" + top: "mixed_4_conv_conv2d" + param 
{ + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_4_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_conv_conv2d" + top: "mixed_4_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_conv_relu" + type: "ReLU" + bottom: "mixed_4_conv_conv2d_bn" + top: "mixed_4_conv_conv2d_relu" +} +layer { + name: "mixed_4_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_3_chconcat" + top: "mixed_4_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_4_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_conv_conv2d" + top: "mixed_4_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_conv_relu" + type: "ReLU" + bottom: "mixed_4_tower_conv_conv2d_bn" + top: "mixed_4_tower_conv_conv2d_relu" +} +layer { + name: "mixed_4_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_conv_conv2d_relu" + top: "mixed_4_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: 
"mixed_4_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_conv_1_conv2d" + top: "mixed_4_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_4_tower_conv_1_conv2d_bn" + top: "mixed_4_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_4_tower_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_conv_1_conv2d_relu" + top: "mixed_4_tower_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_4_tower_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_conv_2_conv2d" + top: "mixed_4_tower_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_conv_2_relu" + type: "ReLU" + bottom: "mixed_4_tower_conv_2_conv2d_bn" + top: "mixed_4_tower_conv_2_conv2d_relu" +} +layer { + name: "mixed_4_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_3_chconcat" + top: "mixed_4_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 8 + fl_params: 8 + } +} +layer { + name: "mixed_4_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_1_conv_conv2d" + top: "mixed_4_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_4_tower_1_conv_conv2d_bn" + top: "mixed_4_tower_1_conv_conv2d_relu" 
+} +layer { + name: "mixed_4_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_1_conv_conv2d_relu" + top: "mixed_4_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 8 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_4_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_1_conv_1_conv2d" + top: "mixed_4_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_4_tower_1_conv_1_conv2d_bn" + top: "mixed_4_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_4_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_1_conv_1_conv2d_relu" + top: "mixed_4_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_4_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_1_conv_2_conv2d" + top: "mixed_4_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_4_tower_1_conv_2_conv2d_bn" + top: "mixed_4_tower_1_conv_2_conv2d_relu" +} +layer { + name: "mixed_4_tower_1_conv_3_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_1_conv_2_conv2d_relu" + top: "mixed_4_tower_1_conv_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 128 
+ bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_4_tower_1_conv_3_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_1_conv_3_conv2d" + top: "mixed_4_tower_1_conv_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_1_conv_3_relu" + type: "ReLU" + bottom: "mixed_4_tower_1_conv_3_conv2d_bn" + top: "mixed_4_tower_1_conv_3_conv2d_relu" +} +layer { + name: "mixed_4_tower_1_conv_4_conv2d" + type: "Convolution" + bottom: "mixed_4_tower_1_conv_3_conv2d_relu" + top: "mixed_4_tower_1_conv_4_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_4_tower_1_conv_4_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_1_conv_4_conv2d" + top: "mixed_4_tower_1_conv_4_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_1_conv_4_relu" + type: "ReLU" + bottom: "mixed_4_tower_1_conv_4_conv2d_bn" + top: "mixed_4_tower_1_conv_4_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_4_pool" + type: "Pooling" + bottom: "ch_concat_mixed_3_chconcat" + top: "AVE_pool_mixed_4_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_4_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_4_pool" + top: "mixed_4_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 
1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 6 + } +} +layer { + name: "mixed_4_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_4_tower_2_conv_conv2d" + top: "mixed_4_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_4_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_4_tower_2_conv_conv2d_bn" + top: "mixed_4_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_4_chconcat" + type: "Concat" + bottom: "mixed_4_conv_conv2d_relu" + bottom: "mixed_4_tower_conv_2_conv2d_relu" + bottom: "mixed_4_tower_1_conv_4_conv2d_relu" + bottom: "mixed_4_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_4_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_5_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_4_chconcat" + top: "mixed_5_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_5_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_conv_conv2d" + top: "mixed_5_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_conv_relu" + type: "ReLU" + bottom: "mixed_5_conv_conv2d_bn" + top: "mixed_5_conv_conv2d_relu" +} +layer { + name: "mixed_5_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_4_chconcat" + top: "mixed_5_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: 
DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_conv_conv2d" + top: "mixed_5_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_conv_relu" + type: "ReLU" + bottom: "mixed_5_tower_conv_conv2d_bn" + top: "mixed_5_tower_conv_conv2d_relu" +} +layer { + name: "mixed_5_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_conv_conv2d_relu" + top: "mixed_5_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_conv_1_conv2d" + top: "mixed_5_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_5_tower_conv_1_conv2d_bn" + top: "mixed_5_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_5_tower_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_conv_1_conv2d_relu" + top: "mixed_5_tower_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_conv_2_conv2d" + top: "mixed_5_tower_conv_2_conv2d_bn" + 
batch_norm_param { + } +} +layer { + name: "mixed_5_tower_conv_2_relu" + type: "ReLU" + bottom: "mixed_5_tower_conv_2_conv2d_bn" + top: "mixed_5_tower_conv_2_conv2d_relu" +} +layer { + name: "mixed_5_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_4_chconcat" + top: "mixed_5_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_5_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_1_conv_conv2d" + top: "mixed_5_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_5_tower_1_conv_conv2d_bn" + top: "mixed_5_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_5_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_1_conv_conv2d_relu" + top: "mixed_5_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_1_conv_1_conv2d" + top: "mixed_5_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_5_tower_1_conv_1_conv2d_bn" + top: "mixed_5_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_5_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_1_conv_1_conv2d_relu" 
+ top: "mixed_5_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_1_conv_2_conv2d" + top: "mixed_5_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_5_tower_1_conv_2_conv2d_bn" + top: "mixed_5_tower_1_conv_2_conv2d_relu" +} +layer { + name: "mixed_5_tower_1_conv_3_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_1_conv_2_conv2d_relu" + top: "mixed_5_tower_1_conv_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_5_tower_1_conv_3_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_1_conv_3_conv2d" + top: "mixed_5_tower_1_conv_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_1_conv_3_relu" + type: "ReLU" + bottom: "mixed_5_tower_1_conv_3_conv2d_bn" + top: "mixed_5_tower_1_conv_3_conv2d_relu" +} +layer { + name: "mixed_5_tower_1_conv_4_conv2d" + type: "Convolution" + bottom: "mixed_5_tower_1_conv_3_conv2d_relu" + top: "mixed_5_tower_1_conv_4_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 
+ kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_1_conv_4_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_1_conv_4_conv2d" + top: "mixed_5_tower_1_conv_4_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_1_conv_4_relu" + type: "ReLU" + bottom: "mixed_5_tower_1_conv_4_conv2d_bn" + top: "mixed_5_tower_1_conv_4_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_5_pool" + type: "Pooling" + bottom: "ch_concat_mixed_4_chconcat" + top: "AVE_pool_mixed_5_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_5_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_5_pool" + top: "mixed_5_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_5_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_5_tower_2_conv_conv2d" + top: "mixed_5_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_5_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_5_tower_2_conv_conv2d_bn" + top: "mixed_5_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_5_chconcat" + type: "Concat" + bottom: "mixed_5_conv_conv2d_relu" + bottom: "mixed_5_tower_conv_2_conv2d_relu" + bottom: "mixed_5_tower_1_conv_4_conv2d_relu" + bottom: "mixed_5_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_5_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_6_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_5_chconcat" + top: "mixed_6_conv_conv2d" + param { + 
lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_6_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_conv_conv2d" + top: "mixed_6_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_conv_relu" + type: "ReLU" + bottom: "mixed_6_conv_conv2d_bn" + top: "mixed_6_conv_conv2d_relu" +} +layer { + name: "mixed_6_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_5_chconcat" + top: "mixed_6_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_6_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_conv_conv2d" + top: "mixed_6_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_conv_relu" + type: "ReLU" + bottom: "mixed_6_tower_conv_conv2d_bn" + top: "mixed_6_tower_conv_conv2d_relu" +} +layer { + name: "mixed_6_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_conv_conv2d_relu" + top: "mixed_6_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: 
"mixed_6_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_conv_1_conv2d" + top: "mixed_6_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_6_tower_conv_1_conv2d_bn" + top: "mixed_6_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_6_tower_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_conv_1_conv2d_relu" + top: "mixed_6_tower_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_6_tower_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_conv_2_conv2d" + top: "mixed_6_tower_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_conv_2_relu" + type: "ReLU" + bottom: "mixed_6_tower_conv_2_conv2d_bn" + top: "mixed_6_tower_conv_2_conv2d_relu" +} +layer { + name: "mixed_6_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_5_chconcat" + top: "mixed_6_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_6_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_1_conv_conv2d" + top: "mixed_6_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_6_tower_1_conv_conv2d_bn" + top: "mixed_6_tower_1_conv_conv2d_relu" 
+} +layer { + name: "mixed_6_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_1_conv_conv2d_relu" + top: "mixed_6_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_6_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_1_conv_1_conv2d" + top: "mixed_6_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_6_tower_1_conv_1_conv2d_bn" + top: "mixed_6_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_6_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_1_conv_1_conv2d_relu" + top: "mixed_6_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_6_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_1_conv_2_conv2d" + top: "mixed_6_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_6_tower_1_conv_2_conv2d_bn" + top: "mixed_6_tower_1_conv_2_conv2d_relu" +} +layer { + name: "mixed_6_tower_1_conv_3_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_1_conv_2_conv2d_relu" + top: "mixed_6_tower_1_conv_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 160 
+ bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_6_tower_1_conv_3_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_1_conv_3_conv2d" + top: "mixed_6_tower_1_conv_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_1_conv_3_relu" + type: "ReLU" + bottom: "mixed_6_tower_1_conv_3_conv2d_bn" + top: "mixed_6_tower_1_conv_3_conv2d_relu" +} +layer { + name: "mixed_6_tower_1_conv_4_conv2d" + type: "Convolution" + bottom: "mixed_6_tower_1_conv_3_conv2d_relu" + top: "mixed_6_tower_1_conv_4_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_6_tower_1_conv_4_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_1_conv_4_conv2d" + top: "mixed_6_tower_1_conv_4_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_1_conv_4_relu" + type: "ReLU" + bottom: "mixed_6_tower_1_conv_4_conv2d_bn" + top: "mixed_6_tower_1_conv_4_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_6_pool" + type: "Pooling" + bottom: "ch_concat_mixed_5_chconcat" + top: "AVE_pool_mixed_6_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_6_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_6_pool" + top: "mixed_6_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 
1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 6 + } +} +layer { + name: "mixed_6_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_6_tower_2_conv_conv2d" + top: "mixed_6_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_6_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_6_tower_2_conv_conv2d_bn" + top: "mixed_6_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_6_chconcat" + type: "Concat" + bottom: "mixed_6_conv_conv2d_relu" + bottom: "mixed_6_tower_conv_2_conv2d_relu" + bottom: "mixed_6_tower_1_conv_4_conv2d_relu" + bottom: "mixed_6_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_6_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_7_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_6_chconcat" + top: "mixed_7_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_7_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_conv_conv2d" + top: "mixed_7_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_conv_relu" + type: "ReLU" + bottom: "mixed_7_conv_conv2d_bn" + top: "mixed_7_conv_conv2d_relu" +} +layer { + name: "mixed_7_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_6_chconcat" + top: "mixed_7_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: 
DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_conv_conv2d" + top: "mixed_7_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_conv_relu" + type: "ReLU" + bottom: "mixed_7_tower_conv_conv2d_bn" + top: "mixed_7_tower_conv_conv2d_relu" +} +layer { + name: "mixed_7_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_conv_conv2d_relu" + top: "mixed_7_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_conv_1_conv2d" + top: "mixed_7_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_7_tower_conv_1_conv2d_bn" + top: "mixed_7_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_7_tower_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_conv_1_conv2d_relu" + top: "mixed_7_tower_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_conv_2_conv2d" + top: "mixed_7_tower_conv_2_conv2d_bn" + 
batch_norm_param { + } +} +layer { + name: "mixed_7_tower_conv_2_relu" + type: "ReLU" + bottom: "mixed_7_tower_conv_2_conv2d_bn" + top: "mixed_7_tower_conv_2_conv2d_relu" +} +layer { + name: "mixed_7_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_6_chconcat" + top: "mixed_7_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_1_conv_conv2d" + top: "mixed_7_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_7_tower_1_conv_conv2d_bn" + top: "mixed_7_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_7_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_1_conv_conv2d_relu" + top: "mixed_7_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_1_conv_1_conv2d" + top: "mixed_7_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_7_tower_1_conv_1_conv2d_bn" + top: "mixed_7_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_7_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_1_conv_1_conv2d_relu" 
+ top: "mixed_7_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_1_conv_2_conv2d" + top: "mixed_7_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_1_conv_2_relu" + type: "ReLU" + bottom: "mixed_7_tower_1_conv_2_conv2d_bn" + top: "mixed_7_tower_1_conv_2_conv2d_relu" +} +layer { + name: "mixed_7_tower_1_conv_3_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_1_conv_2_conv2d_relu" + top: "mixed_7_tower_1_conv_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_1_conv_3_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_1_conv_3_conv2d" + top: "mixed_7_tower_1_conv_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_1_conv_3_relu" + type: "ReLU" + bottom: "mixed_7_tower_1_conv_3_conv2d_bn" + top: "mixed_7_tower_1_conv_3_conv2d_relu" +} +layer { + name: "mixed_7_tower_1_conv_4_conv2d" + type: "Convolution" + bottom: "mixed_7_tower_1_conv_3_conv2d_relu" + top: "mixed_7_tower_1_conv_4_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 
+ kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_7_tower_1_conv_4_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_1_conv_4_conv2d" + top: "mixed_7_tower_1_conv_4_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_1_conv_4_relu" + type: "ReLU" + bottom: "mixed_7_tower_1_conv_4_conv2d_bn" + top: "mixed_7_tower_1_conv_4_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_7_pool" + type: "Pooling" + bottom: "ch_concat_mixed_6_chconcat" + top: "AVE_pool_mixed_7_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_7_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_7_pool" + top: "mixed_7_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_7_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_7_tower_2_conv_conv2d" + top: "mixed_7_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_7_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_7_tower_2_conv_conv2d_bn" + top: "mixed_7_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_7_chconcat" + type: "Concat" + bottom: "mixed_7_conv_conv2d_relu" + bottom: "mixed_7_tower_conv_2_conv2d_relu" + bottom: "mixed_7_tower_1_conv_4_conv2d_relu" + bottom: "mixed_7_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_7_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_8_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_7_chconcat" + top: "mixed_8_tower_conv_conv2d" + 
param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_8_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_conv_conv2d" + top: "mixed_8_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_conv_relu" + type: "ReLU" + bottom: "mixed_8_tower_conv_conv2d_bn" + top: "mixed_8_tower_conv_conv2d_relu" +} +layer { + name: "mixed_8_tower_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_8_tower_conv_conv2d_relu" + top: "mixed_8_tower_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 320 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 7 + } +} +layer { + name: "mixed_8_tower_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_conv_1_conv2d" + top: "mixed_8_tower_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_conv_1_relu" + type: "ReLU" + bottom: "mixed_8_tower_conv_1_conv2d_bn" + top: "mixed_8_tower_conv_1_conv2d_relu" +} +layer { + name: "mixed_8_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_7_chconcat" + top: "mixed_8_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + 
fl_params: 7 + } +} +layer { + name: "mixed_8_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_1_conv_conv2d" + top: "mixed_8_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_8_tower_1_conv_conv2d_bn" + top: "mixed_8_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_8_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_8_tower_1_conv_conv2d_relu" + top: "mixed_8_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 3 + kernel_h: 1 + kernel_w: 7 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 6 + } +} +layer { + name: "mixed_8_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_1_conv_1_conv2d" + top: "mixed_8_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_8_tower_1_conv_1_conv2d_bn" + top: "mixed_8_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_8_tower_1_conv_2_conv2d" + type: "Convolution" + bottom: "mixed_8_tower_1_conv_1_conv2d_relu" + top: "mixed_8_tower_1_conv_2_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 3 + pad_w: 0 + kernel_h: 7 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_8_tower_1_conv_2_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_1_conv_2_conv2d" + top: "mixed_8_tower_1_conv_2_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_1_conv_2_relu" + 
type: "ReLU" + bottom: "mixed_8_tower_1_conv_2_conv2d_bn" + top: "mixed_8_tower_1_conv_2_conv2d_relu" +} +layer { + name: "mixed_8_tower_1_conv_3_conv2d" + type: "Convolution" + bottom: "mixed_8_tower_1_conv_2_conv2d_relu" + top: "mixed_8_tower_1_conv_3_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 3 + stride: 2 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_8_tower_1_conv_3_batchnorm" + type: "BatchNorm" + bottom: "mixed_8_tower_1_conv_3_conv2d" + top: "mixed_8_tower_1_conv_3_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_8_tower_1_conv_3_relu" + type: "ReLU" + bottom: "mixed_8_tower_1_conv_3_conv2d_bn" + top: "mixed_8_tower_1_conv_3_conv2d_relu" +} +layer { + name: "MAX_pool_mixed_8_pool" + type: "Pooling" + bottom: "ch_concat_mixed_7_chconcat" + top: "MAX_pool_mixed_8_pool" + pooling_param { + pool: MAX + pad: 0 + kernel_size: 3 + stride: 2 + } +} +layer { + name: "ch_concat_mixed_8_chconcat" + type: "Concat" + bottom: "mixed_8_tower_conv_1_conv2d_relu" + bottom: "mixed_8_tower_1_conv_3_conv2d_relu" + bottom: "MAX_pool_mixed_8_pool" + top: "ch_concat_mixed_8_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_9_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_8_chconcat" + top: "mixed_9_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 320 + bias_term: false + pad: 0 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + kernel_h: 1 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 8 + fl_params: 8 + } +} +layer { + name: "mixed_9_conv_batchnorm" + type: "BatchNorm" + bottom: 
"mixed_9_conv_conv2d" + top: "mixed_9_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_conv_relu" + type: "ReLU" + bottom: "mixed_9_conv_conv2d_bn" + top: "mixed_9_conv_conv2d_relu" +} +layer { + name: "mixed_9_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_8_chconcat" + top: "mixed_9_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_9_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_conv_conv2d" + top: "mixed_9_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_conv_relu" + type: "ReLU" + bottom: "mixed_9_tower_conv_conv2d_bn" + top: "mixed_9_tower_conv_conv2d_relu" +} +layer { + name: "mixed_9_tower_mixed_conv_conv2d" + type: "Convolution" + bottom: "mixed_9_tower_conv_conv2d_relu" + top: "mixed_9_tower_mixed_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 1 + kernel_h: 1 + kernel_w: 3 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_9_tower_mixed_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_mixed_conv_conv2d" + top: "mixed_9_tower_mixed_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_mixed_conv_relu" + type: "ReLU" + bottom: "mixed_9_tower_mixed_conv_conv2d_bn" + top: "mixed_9_tower_mixed_conv_conv2d_relu" +} +layer { + name: "mixed_9_tower_mixed_conv_1_conv2d" + type: "Convolution" + bottom: 
"mixed_9_tower_conv_conv2d_relu" + top: "mixed_9_tower_mixed_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 1 + pad_w: 0 + kernel_h: 3 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_9_tower_mixed_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_mixed_conv_1_conv2d" + top: "mixed_9_tower_mixed_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_mixed_conv_1_relu" + type: "ReLU" + bottom: "mixed_9_tower_mixed_conv_1_conv2d_bn" + top: "mixed_9_tower_mixed_conv_1_conv2d_relu" +} +layer { + name: "mixed_9_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_8_chconcat" + top: "mixed_9_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 448 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 7 + } +} +layer { + name: "mixed_9_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_1_conv_conv2d" + top: "mixed_9_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_1_conv_relu" + type: "ReLU" + bottom: "mixed_9_tower_1_conv_conv2d_bn" + top: "mixed_9_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_9_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_9_tower_1_conv_conv2d_relu" + top: "mixed_9_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + 
} + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 9 + } +} +layer { + name: "mixed_9_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_1_conv_1_conv2d" + top: "mixed_9_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_9_tower_1_conv_1_conv2d_bn" + top: "mixed_9_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_9_tower_1_mixed_conv_conv2d" + type: "Convolution" + bottom: "mixed_9_tower_1_conv_1_conv2d_relu" + top: "mixed_9_tower_1_mixed_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 1 + kernel_h: 1 + kernel_w: 3 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 9 + } +} +layer { + name: "mixed_9_tower_1_mixed_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_1_mixed_conv_conv2d" + top: "mixed_9_tower_1_mixed_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_1_mixed_conv_relu" + type: "ReLU" + bottom: "mixed_9_tower_1_mixed_conv_conv2d_bn" + top: "mixed_9_tower_1_mixed_conv_conv2d_relu" +} +layer { + name: "mixed_9_tower_1_mixed_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_9_tower_1_conv_1_conv2d_relu" + top: "mixed_9_tower_1_mixed_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 1 + pad_w: 0 + kernel_h: 3 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: 
"mixed_9_tower_1_mixed_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_1_mixed_conv_1_conv2d" + top: "mixed_9_tower_1_mixed_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_1_mixed_conv_1_relu" + type: "ReLU" + bottom: "mixed_9_tower_1_mixed_conv_1_conv2d_bn" + top: "mixed_9_tower_1_mixed_conv_1_conv2d_relu" +} +layer { + name: "AVE_pool_mixed_9_pool" + type: "Pooling" + bottom: "ch_concat_mixed_8_chconcat" + top: "AVE_pool_mixed_9_pool" + pooling_param { + pool: AVE + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_9_tower_2_conv_conv2d" + type: "Convolution" + bottom: "AVE_pool_mixed_9_pool" + top: "mixed_9_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 8 + fl_params: 6 + } +} +layer { + name: "mixed_9_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_9_tower_2_conv_conv2d" + top: "mixed_9_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_9_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_9_tower_2_conv_conv2d_bn" + top: "mixed_9_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_9_chconcat" + type: "Concat" + bottom: "mixed_9_conv_conv2d_relu" + bottom: "mixed_9_tower_mixed_conv_conv2d_relu" + bottom: "mixed_9_tower_mixed_conv_1_conv2d_relu" + bottom: "mixed_9_tower_1_mixed_conv_conv2d_relu" + bottom: "mixed_9_tower_1_mixed_conv_1_conv2d_relu" + bottom: "mixed_9_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_9_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "mixed_10_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_9_chconcat" + top: "mixed_10_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param 
{ + num_output: 320 + bias_term: false + pad: 0 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + kernel_h: 1 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 5 + fl_params: 4 + } +} +layer { + name: "mixed_10_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_conv_conv2d" + top: "mixed_10_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_conv_relu" + type: "ReLU" + bottom: "mixed_10_conv_conv2d_bn" + top: "mixed_10_conv_conv2d_relu" +} +layer { + name: "mixed_10_tower_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_9_chconcat" + top: "mixed_10_tower_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 6 + } +} +layer { + name: "mixed_10_tower_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_conv_conv2d" + top: "mixed_10_tower_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_conv_relu" + type: "ReLU" + bottom: "mixed_10_tower_conv_conv2d_bn" + top: "mixed_10_tower_conv_conv2d_relu" +} +layer { + name: "mixed_10_tower_mixed_conv_conv2d" + type: "Convolution" + bottom: "mixed_10_tower_conv_conv2d_relu" + top: "mixed_10_tower_mixed_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 1 + kernel_h: 1 + kernel_w: 3 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 4 + fl_params: 5 + } +} +layer { + name: 
"mixed_10_tower_mixed_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_mixed_conv_conv2d" + top: "mixed_10_tower_mixed_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_mixed_conv_relu" + type: "ReLU" + bottom: "mixed_10_tower_mixed_conv_conv2d_bn" + top: "mixed_10_tower_mixed_conv_conv2d_relu" +} +layer { + name: "mixed_10_tower_mixed_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_10_tower_conv_conv2d_relu" + top: "mixed_10_tower_mixed_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 1 + pad_w: 0 + kernel_h: 3 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 4 + fl_params: 5 + } +} +layer { + name: "mixed_10_tower_mixed_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_mixed_conv_1_conv2d" + top: "mixed_10_tower_mixed_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_mixed_conv_1_relu" + type: "ReLU" + bottom: "mixed_10_tower_mixed_conv_1_conv2d_bn" + top: "mixed_10_tower_mixed_conv_1_conv2d_relu" +} +layer { + name: "mixed_10_tower_1_conv_conv2d" + type: "Convolution" + bottom: "ch_concat_mixed_9_chconcat" + top: "mixed_10_tower_1_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 448 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 6 + fl_params: 6 + } +} +layer { + name: "mixed_10_tower_1_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_1_conv_conv2d" + top: "mixed_10_tower_1_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_1_conv_relu" + type: 
"ReLU" + bottom: "mixed_10_tower_1_conv_conv2d_bn" + top: "mixed_10_tower_1_conv_conv2d_relu" +} +layer { + name: "mixed_10_tower_1_conv_1_conv2d" + type: "Convolution" + bottom: "mixed_10_tower_1_conv_conv2d_relu" + top: "mixed_10_tower_1_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 6 + fl_layer_out: 7 + fl_params: 8 + } +} +layer { + name: "mixed_10_tower_1_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_1_conv_1_conv2d" + top: "mixed_10_tower_1_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_1_conv_1_relu" + type: "ReLU" + bottom: "mixed_10_tower_1_conv_1_conv2d_bn" + top: "mixed_10_tower_1_conv_1_conv2d_relu" +} +layer { + name: "mixed_10_tower_1_mixed_conv_conv2d" + type: "Convolution" + bottom: "mixed_10_tower_1_conv_1_conv2d_relu" + top: "mixed_10_tower_1_mixed_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 0 + pad_w: 1 + kernel_h: 1 + kernel_w: 3 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 4 + fl_params: 5 + } +} +layer { + name: "mixed_10_tower_1_mixed_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_1_mixed_conv_conv2d" + top: "mixed_10_tower_1_mixed_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_1_mixed_conv_relu" + type: "ReLU" + bottom: "mixed_10_tower_1_mixed_conv_conv2d_bn" + top: "mixed_10_tower_1_mixed_conv_conv2d_relu" +} +layer { + name: "mixed_10_tower_1_mixed_conv_1_conv2d" + type: "Convolution" + bottom: 
"mixed_10_tower_1_conv_1_conv2d_relu" + top: "mixed_10_tower_1_mixed_conv_1_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 384 + bias_term: false + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + pad_h: 1 + pad_w: 0 + kernel_h: 3 + kernel_w: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 4 + fl_params: 5 + } +} +layer { + name: "mixed_10_tower_1_mixed_conv_1_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_1_mixed_conv_1_conv2d" + top: "mixed_10_tower_1_mixed_conv_1_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_1_mixed_conv_1_relu" + type: "ReLU" + bottom: "mixed_10_tower_1_mixed_conv_1_conv2d_bn" + top: "mixed_10_tower_1_mixed_conv_1_conv2d_relu" +} +layer { + name: "MAX_pool_mixed_10_pool" + type: "Pooling" + bottom: "ch_concat_mixed_9_chconcat" + top: "MAX_pool_mixed_10_pool" + pooling_param { + pool: MAX + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "mixed_10_tower_2_conv_conv2d" + type: "Convolution" + bottom: "MAX_pool_mixed_10_pool" + top: "mixed_10_tower_2_conv_conv2d" + param { + lr_mult: 1 + decay_mult: 1 + } + convolution_param { + num_output: 192 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "gaussian" + std: 0.01 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 7 + fl_layer_out: 5 + fl_params: 6 + } +} +layer { + name: "mixed_10_tower_2_conv_batchnorm" + type: "BatchNorm" + bottom: "mixed_10_tower_2_conv_conv2d" + top: "mixed_10_tower_2_conv_conv2d_bn" + batch_norm_param { + } +} +layer { + name: "mixed_10_tower_2_conv_relu" + type: "ReLU" + bottom: "mixed_10_tower_2_conv_conv2d_bn" + top: "mixed_10_tower_2_conv_conv2d_relu" +} +layer { + name: "ch_concat_mixed_10_chconcat" + type: "Concat" + bottom: "mixed_10_conv_conv2d_relu" + 
bottom: "mixed_10_tower_mixed_conv_conv2d_relu" + bottom: "mixed_10_tower_mixed_conv_1_conv2d_relu" + bottom: "mixed_10_tower_1_mixed_conv_conv2d_relu" + bottom: "mixed_10_tower_1_mixed_conv_1_conv2d_relu" + bottom: "mixed_10_tower_2_conv_conv2d_relu" + top: "ch_concat_mixed_10_chconcat" + concat_param { + axis: 1 + } +} +layer { + name: "global_pool" + type: "Pooling" + bottom: "ch_concat_mixed_10_chconcat" + top: "global_pool" + pooling_param { + pool: AVE + pad: 0 + kernel_size: 8 + stride: 1 + } +} +layer { + name: "drop" + type: "Dropout" + bottom: "global_pool" + top: "global_pool" + dropout_param { + } +} +layer { + name: "flatten" + type: "Flatten" + bottom: "global_pool" + top: "flatten" +} +layer { + name: "fc1" + type: "InnerProduct" + bottom: "flatten" + top: "fc1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} diff --git a/models/intel_optimized_models/int8/resnet50_int8.prototxt b/models/intel_optimized_models/int8/resnet50_int8.prototxt new file mode 100644 index 000000000..2490f0be2 --- /dev/null +++ b/models/intel_optimized_models/int8/resnet50_int8.prototxt @@ -0,0 +1,3056 @@ +name: "ResNet-50" +layer { + name: "data" + type: "DummyData" + top: "data" + dummy_data_param { + data_filler { + type: "constant" + value: 0.0099999997764825821 + } + shape { + dim: 50 + dim: 3 + dim: 224 + dim: 224 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + dummy_data_param { + data_filler { + type: "constant" + } + shape { + dim: 50 + } + } +} +layer { + name: "conv1" + type: "Convolution" + bottom: "data" + top: "conv1" + convolution_param { + num_output: 64 + pad: 3 + kernel_size: 7 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } +} +layer { + name: "bn_conv1" + type: "BatchNorm" + bottom: "conv1" + top: 
"conv1" + batch_norm_param { + } +} +layer { + name: "scale_conv1" + type: "Scale" + bottom: "conv1" + top: "conv1" + scale_param { + bias_term: true + } +} +layer { + name: "conv1_relu" + type: "ReLU" + bottom: "conv1" + top: "conv1" + relu_param { + } +} +layer { + name: "pool1" + type: "Pooling" + bottom: "conv1" + top: "pool1" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "res2a_branch1" + type: "Convolution" + bottom: "pool1" + top: "res2a_branch1" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn2a_branch1" + type: "BatchNorm" + bottom: "res2a_branch1" + top: "res2a_branch1" + batch_norm_param { + } +} +layer { + name: "scale2a_branch1" + type: "Scale" + bottom: "res2a_branch1" + top: "res2a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2a" + type: "Convolution" + bottom: "pool1" + top: "res2a_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 7 + } +} +layer { + name: "bn2a_branch2a" + type: "BatchNorm" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2a" + type: "Scale" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2a_relu" + type: "ReLU" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + relu_param { + } +} +layer { + name: 
"res2a_branch2b" + type: "Convolution" + bottom: "res2a_branch2a" + top: "res2a_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn2a_branch2b" + type: "BatchNorm" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2b" + type: "Scale" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2b_relu" + type: "ReLU" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + relu_param { + } +} +layer { + name: "res2a_branch2c" + type: "Convolution" + bottom: "res2a_branch2b" + top: "res2a_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn2a_branch2c" + type: "BatchNorm" + bottom: "res2a_branch2c" + top: "res2a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2c" + type: "Scale" + bottom: "res2a_branch2c" + top: "res2a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2a" + type: "Eltwise" + bottom: "res2a_branch1" + bottom: "res2a_branch2c" + top: "res2a" + eltwise_param { + } +} +layer { + name: "res2a_relu" + type: "ReLU" + bottom: "res2a" + top: "res2a" + relu_param { + } +} +layer { + name: "res2b_branch2a" + type: "Convolution" + bottom: "res2a" + top: "res2b_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + 
kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 7 + } +} +layer { + name: "bn2b_branch2a" + type: "BatchNorm" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2a" + type: "Scale" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2b_branch2a_relu" + type: "ReLU" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + relu_param { + } +} +layer { + name: "res2b_branch2b" + type: "Convolution" + bottom: "res2b_branch2a" + top: "res2b_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 7 + } +} +layer { + name: "bn2b_branch2b" + type: "BatchNorm" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2b" + type: "Scale" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2b_branch2b_relu" + type: "ReLU" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + relu_param { + } +} +layer { + name: "res2b_branch2c" + type: "Convolution" + bottom: "res2b_branch2b" + top: "res2b_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + 
fl_params: 6 + } +} +layer { + name: "bn2b_branch2c" + type: "BatchNorm" + bottom: "res2b_branch2c" + top: "res2b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2c" + type: "Scale" + bottom: "res2b_branch2c" + top: "res2b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2b" + type: "Eltwise" + bottom: "res2a" + bottom: "res2b_branch2c" + top: "res2b" + eltwise_param { + } +} +layer { + name: "res2b_relu" + type: "ReLU" + bottom: "res2b" + top: "res2b" + relu_param { + } +} +layer { + name: "res2c_branch2a" + type: "Convolution" + bottom: "res2b" + top: "res2c_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn2c_branch2a" + type: "BatchNorm" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2c_branch2a" + type: "Scale" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2c_branch2a_relu" + type: "ReLU" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + relu_param { + } +} +layer { + name: "res2c_branch2b" + type: "Convolution" + bottom: "res2c_branch2a" + top: "res2c_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn2c_branch2b" + type: "BatchNorm" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + batch_norm_param { + } +} +layer { + name: 
"scale2c_branch2b" + type: "Scale" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2c_branch2b_relu" + type: "ReLU" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + relu_param { + } +} +layer { + name: "res2c_branch2c" + type: "Convolution" + bottom: "res2c_branch2b" + top: "res2c_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn2c_branch2c" + type: "BatchNorm" + bottom: "res2c_branch2c" + top: "res2c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale2c_branch2c" + type: "Scale" + bottom: "res2c_branch2c" + top: "res2c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2c" + type: "Eltwise" + bottom: "res2b" + bottom: "res2c_branch2c" + top: "res2c" + eltwise_param { + } +} +layer { + name: "res2c_relu" + type: "ReLU" + bottom: "res2c" + top: "res2c" + relu_param { + } +} +layer { + name: "res3a_branch1" + type: "Convolution" + bottom: "res2c" + top: "res3a_branch1" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 7 + } +} +layer { + name: "bn3a_branch1" + type: "BatchNorm" + bottom: "res3a_branch1" + top: "res3a_branch1" + batch_norm_param { + } +} +layer { + name: "scale3a_branch1" + type: "Scale" + bottom: "res3a_branch1" + top: "res3a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2a" + type: "Convolution" + 
bottom: "res2c" + top: "res3a_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn3a_branch2a" + type: "BatchNorm" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2a" + type: "Scale" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2a_relu" + type: "ReLU" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + relu_param { + } +} +layer { + name: "res3a_branch2b" + type: "Convolution" + bottom: "res3a_branch2a" + top: "res3a_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn3a_branch2b" + type: "BatchNorm" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2b" + type: "Scale" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2b_relu" + type: "ReLU" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + relu_param { + } +} +layer { + name: "res3a_branch2c" + type: "Convolution" + bottom: "res3a_branch2b" + top: "res3a_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: 
DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn3a_branch2c" + type: "BatchNorm" + bottom: "res3a_branch2c" + top: "res3a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2c" + type: "Scale" + bottom: "res3a_branch2c" + top: "res3a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3a" + type: "Eltwise" + bottom: "res3a_branch1" + bottom: "res3a_branch2c" + top: "res3a" + eltwise_param { + } +} +layer { + name: "res3a_relu" + type: "ReLU" + bottom: "res3a" + top: "res3a" + relu_param { + } +} +layer { + name: "res3b_branch2a" + type: "Convolution" + bottom: "res3a" + top: "res3b_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn3b_branch2a" + type: "BatchNorm" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2a" + type: "Scale" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3b_branch2a_relu" + type: "ReLU" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + relu_param { + } +} +layer { + name: "res3b_branch2b" + type: "Convolution" + bottom: "res3b_branch2a" + top: "res3b_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn3b_branch2b" + type: 
"BatchNorm" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2b" + type: "Scale" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3b_branch2b_relu" + type: "ReLU" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + relu_param { + } +} +layer { + name: "res3b_branch2c" + type: "Convolution" + bottom: "res3b_branch2b" + top: "res3b_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 5 + } +} +layer { + name: "bn3b_branch2c" + type: "BatchNorm" + bottom: "res3b_branch2c" + top: "res3b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2c" + type: "Scale" + bottom: "res3b_branch2c" + top: "res3b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3b" + type: "Eltwise" + bottom: "res3a" + bottom: "res3b_branch2c" + top: "res3b" + eltwise_param { + } +} +layer { + name: "res3b_relu" + type: "ReLU" + bottom: "res3b" + top: "res3b" + relu_param { + } +} +layer { + name: "res3c_branch2a" + type: "Convolution" + bottom: "res3b" + top: "res3c_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 7 + } +} +layer { + name: "bn3c_branch2a" + type: "BatchNorm" + bottom: "res3c_branch2a" + top: "res3c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2a" + type: "Scale" + bottom: "res3c_branch2a" + top: 
"res3c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3c_branch2a_relu" + type: "ReLU" + bottom: "res3c_branch2a" + top: "res3c_branch2a" + relu_param { + } +} +layer { + name: "res3c_branch2b" + type: "Convolution" + bottom: "res3c_branch2a" + top: "res3c_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 1 + fl_params: 6 + } +} +layer { + name: "bn3c_branch2b" + type: "BatchNorm" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2b" + type: "Scale" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3c_branch2b_relu" + type: "ReLU" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + relu_param { + } +} +layer { + name: "res3c_branch2c" + type: "Convolution" + bottom: "res3c_branch2b" + top: "res3c_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 1 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn3c_branch2c" + type: "BatchNorm" + bottom: "res3c_branch2c" + top: "res3c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2c" + type: "Scale" + bottom: "res3c_branch2c" + top: "res3c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3c" + type: "Eltwise" + bottom: "res3b" + bottom: "res3c_branch2c" + top: "res3c" + eltwise_param { + } +} +layer { + name: "res3c_relu" + type: "ReLU" + bottom: "res3c" + top: "res3c" + 
relu_param { + } +} +layer { + name: "res3d_branch2a" + type: "Convolution" + bottom: "res3c" + top: "res3d_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn3d_branch2a" + type: "BatchNorm" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2a" + type: "Scale" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3d_branch2a_relu" + type: "ReLU" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + relu_param { + } +} +layer { + name: "res3d_branch2b" + type: "Convolution" + bottom: "res3d_branch2a" + top: "res3d_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn3d_branch2b" + type: "BatchNorm" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2b" + type: "Scale" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3d_branch2b_relu" + type: "ReLU" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + relu_param { + } +} +layer { + name: "res3d_branch2c" + type: "Convolution" + bottom: "res3d_branch2b" + top: "res3d_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { 
+ type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 6 + } +} +layer { + name: "bn3d_branch2c" + type: "BatchNorm" + bottom: "res3d_branch2c" + top: "res3d_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2c" + type: "Scale" + bottom: "res3d_branch2c" + top: "res3d_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3d" + type: "Eltwise" + bottom: "res3c" + bottom: "res3d_branch2c" + top: "res3d" + eltwise_param { + } +} +layer { + name: "res3d_relu" + type: "ReLU" + bottom: "res3d" + top: "res3d" + relu_param { + } +} +layer { + name: "res4a_branch1" + type: "Convolution" + bottom: "res3d" + top: "res4a_branch1" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4a_branch1" + type: "BatchNorm" + bottom: "res4a_branch1" + top: "res4a_branch1" + batch_norm_param { + } +} +layer { + name: "scale4a_branch1" + type: "Scale" + bottom: "res4a_branch1" + top: "res4a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2a" + type: "Convolution" + bottom: "res3d" + top: "res4a_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn4a_branch2a" + type: "BatchNorm" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + 
batch_norm_param { + } +} +layer { + name: "scale4a_branch2a" + type: "Scale" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2a_relu" + type: "ReLU" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + relu_param { + } +} +layer { + name: "res4a_branch2b" + type: "Convolution" + bottom: "res4a_branch2a" + top: "res4a_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn4a_branch2b" + type: "BatchNorm" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4a_branch2b" + type: "Scale" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2b_relu" + type: "ReLU" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + relu_param { + } +} +layer { + name: "res4a_branch2c" + type: "Convolution" + bottom: "res4a_branch2b" + top: "res4a_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4a_branch2c" + type: "BatchNorm" + bottom: "res4a_branch2c" + top: "res4a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4a_branch2c" + type: "Scale" + bottom: "res4a_branch2c" + top: "res4a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4a" + type: "Eltwise" + bottom: "res4a_branch1" + bottom: "res4a_branch2c" + 
top: "res4a" + eltwise_param { + } +} +layer { + name: "res4a_relu" + type: "ReLU" + bottom: "res4a" + top: "res4a" + relu_param { + } +} +layer { + name: "res4b_branch2a" + type: "Convolution" + bottom: "res4a" + top: "res4b_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn4b_branch2a" + type: "BatchNorm" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2a" + type: "Scale" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4b_branch2a_relu" + type: "ReLU" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + relu_param { + } +} +layer { + name: "res4b_branch2b" + type: "Convolution" + bottom: "res4b_branch2a" + top: "res4b_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4b_branch2b" + type: "BatchNorm" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2b" + type: "Scale" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4b_branch2b_relu" + type: "ReLU" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + relu_param { + } +} +layer { + name: "res4b_branch2c" + type: "Convolution" + bottom: "res4b_branch2b" + top: "res4b_branch2c" + convolution_param { + 
num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4b_branch2c" + type: "BatchNorm" + bottom: "res4b_branch2c" + top: "res4b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2c" + type: "Scale" + bottom: "res4b_branch2c" + top: "res4b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4b" + type: "Eltwise" + bottom: "res4a" + bottom: "res4b_branch2c" + top: "res4b" + eltwise_param { + } +} +layer { + name: "res4b_relu" + type: "ReLU" + bottom: "res4b" + top: "res4b" + relu_param { + } +} +layer { + name: "res4c_branch2a" + type: "Convolution" + bottom: "res4b" + top: "res4c_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn4c_branch2a" + type: "BatchNorm" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2a" + type: "Scale" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4c_branch2a_relu" + type: "ReLU" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + relu_param { + } +} +layer { + name: "res4c_branch2b" + type: "Convolution" + bottom: "res4c_branch2a" + top: "res4c_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + 
quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4c_branch2b" + type: "BatchNorm" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2b" + type: "Scale" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4c_branch2b_relu" + type: "ReLU" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + relu_param { + } +} +layer { + name: "res4c_branch2c" + type: "Convolution" + bottom: "res4c_branch2b" + top: "res4c_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4c_branch2c" + type: "BatchNorm" + bottom: "res4c_branch2c" + top: "res4c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2c" + type: "Scale" + bottom: "res4c_branch2c" + top: "res4c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4c" + type: "Eltwise" + bottom: "res4b" + bottom: "res4c_branch2c" + top: "res4c" + eltwise_param { + } +} +layer { + name: "res4c_relu" + type: "ReLU" + bottom: "res4c" + top: "res4c" + relu_param { + } +} +layer { + name: "res4d_branch2a" + type: "Convolution" + bottom: "res4c" + top: "res4d_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + 
name: "bn4d_branch2a" + type: "BatchNorm" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2a" + type: "Scale" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4d_branch2a_relu" + type: "ReLU" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + relu_param { + } +} +layer { + name: "res4d_branch2b" + type: "Convolution" + bottom: "res4d_branch2a" + top: "res4d_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4d_branch2b" + type: "BatchNorm" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2b" + type: "Scale" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4d_branch2b_relu" + type: "ReLU" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + relu_param { + } +} +layer { + name: "res4d_branch2c" + type: "Convolution" + bottom: "res4d_branch2b" + top: "res4d_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4d_branch2c" + type: "BatchNorm" + bottom: "res4d_branch2c" + top: "res4d_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2c" + type: "Scale" + bottom: "res4d_branch2c" + top: "res4d_branch2c" + scale_param { + bias_term: true + } +} 
+layer { + name: "res4d" + type: "Eltwise" + bottom: "res4c" + bottom: "res4d_branch2c" + top: "res4d" + eltwise_param { + } +} +layer { + name: "res4d_relu" + type: "ReLU" + bottom: "res4d" + top: "res4d" + relu_param { + } +} +layer { + name: "res4e_branch2a" + type: "Convolution" + bottom: "res4d" + top: "res4e_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn4e_branch2a" + type: "BatchNorm" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2a" + type: "Scale" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4e_branch2a_relu" + type: "ReLU" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + relu_param { + } +} +layer { + name: "res4e_branch2b" + type: "Convolution" + bottom: "res4e_branch2a" + top: "res4e_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4e_branch2b" + type: "BatchNorm" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2b" + type: "Scale" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4e_branch2b_relu" + type: "ReLU" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + relu_param { + } +} +layer { + name: "res4e_branch2c" + type: 
"Convolution" + bottom: "res4e_branch2b" + top: "res4e_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4e_branch2c" + type: "BatchNorm" + bottom: "res4e_branch2c" + top: "res4e_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2c" + type: "Scale" + bottom: "res4e_branch2c" + top: "res4e_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4e" + type: "Eltwise" + bottom: "res4d" + bottom: "res4e_branch2c" + top: "res4e" + eltwise_param { + } +} +layer { + name: "res4e_relu" + type: "ReLU" + bottom: "res4e" + top: "res4e" + relu_param { + } +} +layer { + name: "res4f_branch2a" + type: "Convolution" + bottom: "res4e" + top: "res4f_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn4f_branch2a" + type: "BatchNorm" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2a" + type: "Scale" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4f_branch2a_relu" + type: "ReLU" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + relu_param { + } +} +layer { + name: "res4f_branch2b" + type: "Convolution" + bottom: "res4f_branch2a" + top: "res4f_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + 
weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 2 + fl_params: 7 + } +} +layer { + name: "bn4f_branch2b" + type: "BatchNorm" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2b" + type: "Scale" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4f_branch2b_relu" + type: "ReLU" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + relu_param { + } +} +layer { + name: "res4f_branch2c" + type: "Convolution" + bottom: "res4f_branch2b" + top: "res4f_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 2 + fl_params: 6 + } +} +layer { + name: "bn4f_branch2c" + type: "BatchNorm" + bottom: "res4f_branch2c" + top: "res4f_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2c" + type: "Scale" + bottom: "res4f_branch2c" + top: "res4f_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4f" + type: "Eltwise" + bottom: "res4e" + bottom: "res4f_branch2c" + top: "res4f" + eltwise_param { + } +} +layer { + name: "res4f_relu" + type: "ReLU" + bottom: "res4f" + top: "res4f" + relu_param { + } +} +layer { + name: "res5a_branch1" + type: "Convolution" + bottom: "res4f" + top: "res5a_branch1" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + 
bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 0 + fl_params: 5 + } +} +layer { + name: "bn5a_branch1" + type: "BatchNorm" + bottom: "res5a_branch1" + top: "res5a_branch1" + batch_norm_param { + } +} +layer { + name: "scale5a_branch1" + type: "Scale" + bottom: "res5a_branch1" + top: "res5a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2a" + type: "Convolution" + bottom: "res4f" + top: "res5a_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 4 + fl_params: 8 + } +} +layer { + name: "bn5a_branch2a" + type: "BatchNorm" + bottom: "res5a_branch2a" + top: "res5a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2a" + type: "Scale" + bottom: "res5a_branch2a" + top: "res5a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2a_relu" + type: "ReLU" + bottom: "res5a_branch2a" + top: "res5a_branch2a" + relu_param { + } +} +layer { + name: "res5a_branch2b" + type: "Convolution" + bottom: "res5a_branch2a" + top: "res5a_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 7 + } +} +layer { + name: "bn5a_branch2b" + type: "BatchNorm" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2b" + type: "Scale" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2b_relu" + type: 
"ReLU" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + relu_param { + } +} +layer { + name: "res5a_branch2c" + type: "Convolution" + bottom: "res5a_branch2b" + top: "res5a_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 0 + fl_params: 4 + } +} +layer { + name: "bn5a_branch2c" + type: "BatchNorm" + bottom: "res5a_branch2c" + top: "res5a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2c" + type: "Scale" + bottom: "res5a_branch2c" + top: "res5a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5a" + type: "Eltwise" + bottom: "res5a_branch1" + bottom: "res5a_branch2c" + top: "res5a" + eltwise_param { + } +} +layer { + name: "res5a_relu" + type: "ReLU" + bottom: "res5a" + top: "res5a" + relu_param { + } +} +layer { + name: "res5b_branch2a" + type: "Convolution" + bottom: "res5a" + top: "res5b_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 0 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "bn5b_branch2a" + type: "BatchNorm" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2a" + type: "Scale" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5b_branch2a_relu" + type: "ReLU" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + relu_param { + } +} +layer { + name: "res5b_branch2b" + type: "Convolution" + bottom: "res5b_branch2a" + 
top: "res5b_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 7 + } +} +layer { + name: "bn5b_branch2b" + type: "BatchNorm" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2b" + type: "Scale" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5b_branch2b_relu" + type: "ReLU" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + relu_param { + } +} +layer { + name: "res5b_branch2c" + type: "Convolution" + bottom: "res5b_branch2b" + top: "res5b_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 0 + fl_params: 5 + } +} +layer { + name: "bn5b_branch2c" + type: "BatchNorm" + bottom: "res5b_branch2c" + top: "res5b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2c" + type: "Scale" + bottom: "res5b_branch2c" + top: "res5b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5b" + type: "Eltwise" + bottom: "res5a" + bottom: "res5b_branch2c" + top: "res5b" + eltwise_param { + } +} +layer { + name: "res5b_relu" + type: "ReLU" + bottom: "res5b" + top: "res5b" + relu_param { + } +} +layer { + name: "res5c_branch2a" + type: "Convolution" + bottom: "res5b" + top: "res5c_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + 
type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 0 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "bn5c_branch2a" + type: "BatchNorm" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2a" + type: "Scale" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5c_branch2a_relu" + type: "ReLU" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + relu_param { + } +} +layer { + name: "res5c_branch2b" + type: "Convolution" + bottom: "res5c_branch2a" + top: "res5c_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 8 + } +} +layer { + name: "bn5c_branch2b" + type: "BatchNorm" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2b" + type: "Scale" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5c_branch2b_relu" + type: "ReLU" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + relu_param { + } +} +layer { + name: "res5c_branch2c" + type: "Convolution" + bottom: "res5c_branch2b" + top: "res5c_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.2 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 0 + fl_params: 4 + } +} +layer { + name: "bn5c_branch2c" + type: "BatchNorm" + bottom: 
"res5c_branch2c" + top: "res5c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2c" + type: "Scale" + bottom: "res5c_branch2c" + top: "res5c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5c" + type: "Eltwise" + bottom: "res5b" + bottom: "res5c_branch2c" + top: "res5c" + eltwise_param { + } +} +layer { + name: "res5c_relu" + type: "ReLU" + bottom: "res5c" + top: "res5c" + relu_param { + } +} +layer { + name: "pool5" + type: "Pooling" + bottom: "res5c" + top: "pool5" + pooling_param { + pool: AVE + kernel_size: 7 + stride: 1 + } +} +layer { + name: "fc1000" + type: "InnerProduct" + bottom: "pool5" + top: "fc1000" + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "accuracy/top-1" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "accuracy-top1" + include { + phase: TEST + } +} +layer { + name: "accuracy/top-5" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "accuracy-top5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/int8/ssd_int8.prototxt b/models/intel_optimized_models/int8/ssd_int8.prototxt new file mode 100644 index 000000000..583b1962f --- /dev/null +++ b/models/intel_optimized_models/int8/ssd_int8.prototxt @@ -0,0 +1,1864 @@ +name: "VGG_VOC0712_SSD_300x300_test" +layer { + name: "data" + type: "DummyData" + top: "data" + dummy_data_param { + data_filler { + type: "constant" + value: 0.01 + } + shape { + dim: 32 + dim: 3 + dim: 300 + dim: 300 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + dummy_data_param { + data_filler { + type: "constant" + value: 1 + } + shape { + dim: 1 + dim: 1 + dim: 1 + dim: 8 + } + } +} +layer { + name: "conv1_1" + type: "Convolution" + bottom: "data" + top: "conv1_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param 
{ + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "relu1_1" + type: "ReLU" + bottom: "conv1_1" + top: "conv1_1" +} +layer { + name: "conv1_2" + type: "Convolution" + bottom: "conv1_1" + top: "conv1_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 64 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -2 + fl_layer_out: -4 + fl_params: 8 + } +} +layer { + name: "relu1_2" + type: "ReLU" + bottom: "conv1_2" + top: "conv1_2" +} +layer { + name: "pool1" + type: "Pooling" + bottom: "conv1_2" + top: "pool1" + pooling_param { + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + name: "conv2_1" + type: "Convolution" + bottom: "pool1" + top: "conv2_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -4 + fl_layer_out: -5 + fl_params: 8 + } +} +layer { + name: "relu2_1" + type: "ReLU" + bottom: "conv2_1" + top: "conv2_1" +} +layer { + name: "conv2_2" + type: "Convolution" + bottom: "conv2_1" + top: "conv2_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -5 + fl_layer_out: -5 + 
fl_params: 9 + } +} +layer { + name: "relu2_2" + type: "ReLU" + bottom: "conv2_2" + top: "conv2_2" +} +layer { + name: "pool2" + type: "Pooling" + bottom: "conv2_2" + top: "pool2" + pooling_param { + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + name: "conv3_1" + type: "Convolution" + bottom: "pool2" + top: "conv3_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -5 + fl_layer_out: -5 + fl_params: 8 + } +} +layer { + name: "relu3_1" + type: "ReLU" + bottom: "conv3_1" + top: "conv3_1" +} +layer { + name: "conv3_2" + type: "Convolution" + bottom: "conv3_1" + top: "conv3_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -5 + fl_layer_out: -5 + fl_params: 8 + } +} +layer { + name: "relu3_2" + type: "ReLU" + bottom: "conv3_2" + top: "conv3_2" +} +layer { + name: "conv3_3" + type: "Convolution" + bottom: "conv3_2" + top: "conv3_3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -5 + fl_layer_out: -5 + fl_params: 8 + } +} +layer { + name: "relu3_3" + type: "ReLU" + bottom: "conv3_3" + top: "conv3_3" +} +layer { + name: 
"pool3" + type: "Pooling" + bottom: "conv3_3" + top: "pool3" + pooling_param { + pool: MAX + kernel_size: 2 + stride: 2 + } +} +layer { + name: "conv4_1" + type: "Convolution" + bottom: "pool3" + top: "conv4_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -5 + fl_layer_out: -4 + fl_params: 8 + } +} +layer { + name: "relu4_1" + type: "ReLU" + bottom: "conv4_1" + top: "conv4_1" +} +layer { + name: "conv4_2" + type: "Convolution" + bottom: "conv4_1" + top: "conv4_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -4 + fl_layer_out: -3 + fl_params: 8 + } +} +layer { + name: "relu4_2" + type: "ReLU" + bottom: "conv4_2" + top: "conv4_2" +} +layer { + name: "conv4_3" + type: "Convolution" + bottom: "conv4_2" + top: "conv4_3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -3 + fl_layer_out: -2 + fl_params: 9 + } +} +layer { + name: "relu4_3" + type: "ReLU" + bottom: "conv4_3" + top: "conv4_3" +} +layer { + name: "pool4" + type: "Pooling" + bottom: "conv4_3" + top: "pool4" + pooling_param { + pool: MAX + kernel_size: 2 + stride: 2 + } 
+} +layer { + name: "conv5_1" + type: "Convolution" + bottom: "pool4" + top: "conv5_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + dilation: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -2 + fl_layer_out: -1 + fl_params: 9 + } +} +layer { + name: "relu5_1" + type: "ReLU" + bottom: "conv5_1" + top: "conv5_1" +} +layer { + name: "conv5_2" + type: "Convolution" + bottom: "conv5_1" + top: "conv5_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + dilation: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: -1 + fl_layer_out: 0 + fl_params: 9 + } +} +layer { + name: "relu5_2" + type: "ReLU" + bottom: "conv5_2" + top: "conv5_2" +} +layer { + name: "conv5_3" + type: "Convolution" + bottom: "conv5_2" + top: "conv5_3" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + dilation: 1 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 0 + fl_layer_out: 0 + fl_params: 9 + } +} +layer { + name: "relu5_3" + type: "ReLU" + bottom: "conv5_3" + top: "conv5_3" +} +layer { + name: "pool5" + type: "Pooling" + bottom: "conv5_3" + top: "pool5" + pooling_param { + pool: MAX + pad: 1 + kernel_size: 3 + stride: 1 + } +} +layer { + name: "fc6" + type: "Convolution" + bottom: "pool5" + top: 
"fc6" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 1024 + pad: 6 + kernel_size: 3 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + engine: CAFFE + dilation: 6 + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 0 + fl_layer_out: 2 + fl_params: 9 + } +} +layer { + name: "relu6" + type: "ReLU" + bottom: "fc6" + top: "fc6" +} +layer { + name: "fc7" + type: "Convolution" + bottom: "fc6" + top: "fc7" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 1024 + kernel_size: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 2 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "relu7" + type: "ReLU" + bottom: "fc7" + top: "fc7" +} +layer { + name: "conv6_1" + type: "Convolution" + bottom: "fc7" + top: "conv6_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 5 + fl_params: 9 + } +} +layer { + name: "conv6_1_relu" + type: "ReLU" + bottom: "conv6_1" + top: "conv6_1" +} +layer { + name: "conv6_2" + type: "Convolution" + bottom: "conv6_1" + top: "conv6_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 512 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + 
quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 5 + fl_layer_out: 5 + fl_params: 10 + } +} +layer { + name: "conv6_2_relu" + type: "ReLU" + bottom: "conv6_2" + top: "conv6_2" +} +layer { + name: "conv7_1" + type: "Convolution" + bottom: "conv6_2" + top: "conv7_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 5 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "conv7_1_relu" + type: "ReLU" + bottom: "conv7_1" + top: "conv7_1" +} +layer { + name: "conv7_2" + type: "Convolution" + bottom: "conv7_1" + top: "conv7_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 10 + } +} +layer { + name: "conv7_2_relu" + type: "ReLU" + bottom: "conv7_2" + top: "conv7_2" +} +layer { + name: "conv8_1" + type: "Convolution" + bottom: "conv7_2" + top: "conv8_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "conv8_1_relu" + type: "ReLU" + bottom: 
"conv8_1" + top: "conv8_1" +} +layer { + name: "conv8_2" + type: "Convolution" + bottom: "conv8_1" + top: "conv8_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 0 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 10 + } +} +layer { + name: "conv8_2_relu" + type: "ReLU" + bottom: "conv8_2" + top: "conv8_2" +} +layer { + name: "conv9_1" + type: "Convolution" + bottom: "conv8_2" + top: "conv9_1" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 128 + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 4 + fl_params: 9 + } +} +layer { + name: "conv9_1_relu" + type: "ReLU" + bottom: "conv9_1" + top: "conv9_1" +} +layer { + name: "conv9_2" + type: "Convolution" + bottom: "conv9_1" + top: "conv9_2" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 256 + pad: 0 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 3 + fl_params: 10 + } +} +layer { + name: "conv9_2_relu" + type: "ReLU" + bottom: "conv9_2" + top: "conv9_2" +} +layer { + name: "conv4_3_norm" + type: "Normalize" + bottom: "conv4_3" + top: "conv4_3_norm" + norm_param { + across_spatial: false + scale_filler { + type: "constant" + value: 20 + } + 
channel_shared: false + } +} +layer { + name: "conv4_3_norm_mbox_loc" + type: "Convolution" + bottom: "conv4_3_norm" + top: "conv4_3_norm_mbox_loc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv4_3_norm_mbox_loc_perm" + type: "Permute" + bottom: "conv4_3_norm_mbox_loc" + top: "conv4_3_norm_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv4_3_norm_mbox_loc_flat" + type: "Flatten" + bottom: "conv4_3_norm_mbox_loc_perm" + top: "conv4_3_norm_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv4_3_norm_mbox_conf" + type: "Convolution" + bottom: "conv4_3_norm" + top: "conv4_3_norm_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 84 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv4_3_norm_mbox_conf_perm" + type: "Permute" + bottom: "conv4_3_norm_mbox_conf" + top: "conv4_3_norm_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv4_3_norm_mbox_conf_flat" + type: "Flatten" + bottom: "conv4_3_norm_mbox_conf_perm" + top: "conv4_3_norm_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv4_3_norm_mbox_priorbox" + type: "PriorBox" + bottom: "conv4_3_norm" + bottom: "data" + top: "conv4_3_norm_mbox_priorbox" + prior_box_param { + min_size: 30 + max_size: 60 + aspect_ratio: 2 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 8 + offset: 0.5 + } +} +layer { + name: "fc7_mbox_loc" + type: "Convolution" + bottom: "fc7" + top: "fc7_mbox_loc" + param { + lr_mult: 1 + 
decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "fc7_mbox_loc_perm" + type: "Permute" + bottom: "fc7_mbox_loc" + top: "fc7_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "fc7_mbox_loc_flat" + type: "Flatten" + bottom: "fc7_mbox_loc_perm" + top: "fc7_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "fc7_mbox_conf" + type: "Convolution" + bottom: "fc7" + top: "fc7_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 126 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "fc7_mbox_conf_perm" + type: "Permute" + bottom: "fc7_mbox_conf" + top: "fc7_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "fc7_mbox_conf_flat" + type: "Flatten" + bottom: "fc7_mbox_conf_perm" + top: "fc7_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "fc7_mbox_priorbox" + type: "PriorBox" + bottom: "fc7" + bottom: "data" + top: "fc7_mbox_priorbox" + prior_box_param { + min_size: 60 + max_size: 111 + aspect_ratio: 2 + aspect_ratio: 3 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 16 + offset: 0.5 + } +} +layer { + name: "conv6_2_mbox_loc" + type: "Convolution" + bottom: "conv6_2" + top: "conv6_2_mbox_loc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv6_2_mbox_loc_perm" + type: "Permute" + bottom: 
"conv6_2_mbox_loc" + top: "conv6_2_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv6_2_mbox_loc_flat" + type: "Flatten" + bottom: "conv6_2_mbox_loc_perm" + top: "conv6_2_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv6_2_mbox_conf" + type: "Convolution" + bottom: "conv6_2" + top: "conv6_2_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 126 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv6_2_mbox_conf_perm" + type: "Permute" + bottom: "conv6_2_mbox_conf" + top: "conv6_2_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv6_2_mbox_conf_flat" + type: "Flatten" + bottom: "conv6_2_mbox_conf_perm" + top: "conv6_2_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv6_2_mbox_priorbox" + type: "PriorBox" + bottom: "conv6_2" + bottom: "data" + top: "conv6_2_mbox_priorbox" + prior_box_param { + min_size: 111 + max_size: 162 + aspect_ratio: 2 + aspect_ratio: 3 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 32 + offset: 0.5 + } +} +layer { + name: "conv7_2_mbox_loc" + type: "Convolution" + bottom: "conv7_2" + top: "conv7_2_mbox_loc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 24 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv7_2_mbox_loc_perm" + type: "Permute" + bottom: "conv7_2_mbox_loc" + top: "conv7_2_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv7_2_mbox_loc_flat" + type: "Flatten" + bottom: "conv7_2_mbox_loc_perm" + top: 
"conv7_2_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv7_2_mbox_conf" + type: "Convolution" + bottom: "conv7_2" + top: "conv7_2_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 126 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv7_2_mbox_conf_perm" + type: "Permute" + bottom: "conv7_2_mbox_conf" + top: "conv7_2_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv7_2_mbox_conf_flat" + type: "Flatten" + bottom: "conv7_2_mbox_conf_perm" + top: "conv7_2_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv7_2_mbox_priorbox" + type: "PriorBox" + bottom: "conv7_2" + bottom: "data" + top: "conv7_2_mbox_priorbox" + prior_box_param { + min_size: 162 + max_size: 213 + aspect_ratio: 2 + aspect_ratio: 3 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 64 + offset: 0.5 + } +} +layer { + name: "conv8_2_mbox_loc" + type: "Convolution" + bottom: "conv8_2" + top: "conv8_2_mbox_loc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 4 + fl_layer_out: 5 + fl_params: 10 + } +} +layer { + name: "conv8_2_mbox_loc_perm" + type: "Permute" + bottom: "conv8_2_mbox_loc" + top: "conv8_2_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv8_2_mbox_loc_flat" + type: "Flatten" + bottom: "conv8_2_mbox_loc_perm" + top: "conv8_2_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + 
name: "conv8_2_mbox_conf" + type: "Convolution" + bottom: "conv8_2" + top: "conv8_2_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 84 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv8_2_mbox_conf_perm" + type: "Permute" + bottom: "conv8_2_mbox_conf" + top: "conv8_2_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv8_2_mbox_conf_flat" + type: "Flatten" + bottom: "conv8_2_mbox_conf_perm" + top: "conv8_2_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv8_2_mbox_priorbox" + type: "PriorBox" + bottom: "conv8_2" + bottom: "data" + top: "conv8_2_mbox_priorbox" + prior_box_param { + min_size: 213 + max_size: 264 + aspect_ratio: 2 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 100 + offset: 0.5 + } +} +layer { + name: "conv9_2_mbox_loc" + type: "Convolution" + bottom: "conv9_2" + top: "conv9_2_mbox_loc" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 16 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + fl_layer_in: 3 + fl_layer_out: 6 + fl_params: 10 + } +} +layer { + name: "conv9_2_mbox_loc_perm" + type: "Permute" + bottom: "conv9_2_mbox_loc" + top: "conv9_2_mbox_loc_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv9_2_mbox_loc_flat" + type: "Flatten" + bottom: "conv9_2_mbox_loc_perm" + top: "conv9_2_mbox_loc_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv9_2_mbox_conf" + type: "Convolution" + bottom: "conv9_2" + top: 
"conv9_2_mbox_conf" + param { + lr_mult: 1 + decay_mult: 1 + } + param { + lr_mult: 2 + decay_mult: 0 + } + convolution_param { + num_output: 84 + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0 + } + } +} +layer { + name: "conv9_2_mbox_conf_perm" + type: "Permute" + bottom: "conv9_2_mbox_conf" + top: "conv9_2_mbox_conf_perm" + permute_param { + order: 0 + order: 2 + order: 3 + order: 1 + } +} +layer { + name: "conv9_2_mbox_conf_flat" + type: "Flatten" + bottom: "conv9_2_mbox_conf_perm" + top: "conv9_2_mbox_conf_flat" + flatten_param { + axis: 1 + } +} +layer { + name: "conv9_2_mbox_priorbox" + type: "PriorBox" + bottom: "conv9_2" + bottom: "data" + top: "conv9_2_mbox_priorbox" + prior_box_param { + min_size: 264 + max_size: 315 + aspect_ratio: 2 + flip: true + clip: false + variance: 0.1 + variance: 0.1 + variance: 0.2 + variance: 0.2 + step: 300 + offset: 0.5 + } +} +layer { + name: "mbox_loc" + type: "Concat" + bottom: "conv4_3_norm_mbox_loc_flat" + bottom: "fc7_mbox_loc_flat" + bottom: "conv6_2_mbox_loc_flat" + bottom: "conv7_2_mbox_loc_flat" + bottom: "conv8_2_mbox_loc_flat" + bottom: "conv9_2_mbox_loc_flat" + top: "mbox_loc" + concat_param { + axis: 1 + } +} +layer { + name: "mbox_conf" + type: "Concat" + bottom: "conv4_3_norm_mbox_conf_flat" + bottom: "fc7_mbox_conf_flat" + bottom: "conv6_2_mbox_conf_flat" + bottom: "conv7_2_mbox_conf_flat" + bottom: "conv8_2_mbox_conf_flat" + bottom: "conv9_2_mbox_conf_flat" + top: "mbox_conf" + concat_param { + axis: 1 + } +} +layer { + name: "mbox_priorbox" + type: "Concat" + bottom: "conv4_3_norm_mbox_priorbox" + bottom: "fc7_mbox_priorbox" + bottom: "conv6_2_mbox_priorbox" + bottom: "conv7_2_mbox_priorbox" + bottom: "conv8_2_mbox_priorbox" + bottom: "conv9_2_mbox_priorbox" + top: "mbox_priorbox" + concat_param { + axis: 2 + } +} +layer { + name: "mbox_conf_reshape" + type: "Reshape" + bottom: "mbox_conf" + top: "mbox_conf_reshape" + reshape_param { 
+ shape { + dim: 0 + dim: -1 + dim: 21 + } + } +} +layer { + name: "mbox_conf_softmax" + type: "Softmax" + bottom: "mbox_conf_reshape" + top: "mbox_conf_softmax" + softmax_param { + axis: 2 + } +} +layer { + name: "mbox_conf_flatten" + type: "Flatten" + bottom: "mbox_conf_softmax" + top: "mbox_conf_flatten" + flatten_param { + axis: 1 + } +} +layer { + name: "detection_out" + type: "DetectionOutput" + bottom: "mbox_loc" + bottom: "mbox_conf_flatten" + bottom: "mbox_priorbox" + top: "detection_out" + include { + phase: TEST + } + detection_output_param { + num_classes: 21 + share_location: true + background_label_id: 0 + nms_param { + nms_threshold: 0.45 + top_k: 400 + } + code_type: CENTER_SIZE + keep_top_k: 200 + confidence_threshold: 0.01 + } +} diff --git a/src/caffe/layers/mkldnn_concat_layer.cpp b/src/caffe/layers/mkldnn_concat_layer.cpp index 7da1fb8c8..3f86c2f75 100644 --- a/src/caffe/layers/mkldnn_concat_layer.cpp +++ b/src/caffe/layers/mkldnn_concat_layer.cpp @@ -273,7 +273,8 @@ void MKLDNNConcatLayer::InitConcatFwd(const vector*>& bottom, } engine cpu_engine = CpuEngine::Instance().get_engine(); - memory::data_type data_type = memory::data_type::f32; + memory::data_type usr_dt = memory::data_type::f32; + memory::data_type prv_dt = usr_dt; // memory::format mfmt_any = memory::format::any; memory::format mfmt_nchw = memory::format::nchw; @@ -284,6 +285,25 @@ void MKLDNNConcatLayer::InitConcatFwd(const vector*>& bottom, fwd_bottom_data.clear(); fwd_input_primitives_.clear(); fwd_input_primitives_at_.clear(); + + int fl = 0; + int fl_min = 0; + float scale = 1.; + float scale_min = 1.; + for (auto i = 0; i < num_concats_; i++) { + if (const_cast(bottom[i]->prv_data()) != NULL) { + shared_ptr > mem_descr + = get_mkldnn_prv_descriptor(bottom[i]); + fl = mem_descr->get_fl(0); + if (fl_min == 0) fl_min = fl; + if(fl != 0 && fl < fl_min) fl_min = fl; + scale = mem_descr->get_scale(0); + if (scale_min == 1.) scale_min = scale; + if(scale != 1. 
&& scale < scale_min) scale_min = scale; + } + } + + bool bottom_is_float = false; for (auto i = 0; i < num_concats_; i++) { fwd_bottom_data.push_back(boost::shared_ptr >()); @@ -308,37 +328,63 @@ void MKLDNNConcatLayer::InitConcatFwd(const vector*>& bottom, memory::format src_mfmt = mfmt_nchw; shared_ptr prv_src_mpd; shared_ptr usr_src_mpd( - new memory::primitive_desc({input_tz, data_type, mfmt_nchw}, cpu_engine)); - + new memory::primitive_desc({input_tz, usr_dt, mfmt_nchw}, cpu_engine)); + if (const_cast(bottom[i]->prv_data()) != NULL) { + fl = 0; + scale = 1.; shared_ptr > mem_descr = get_mkldnn_prv_descriptor(bottom[i]); + bottom_is_float = mem_descr->get_float(); src_mfmt = static_cast( mem_descr->prv_memory_pd()->desc().data.format); + prv_dt = static_cast(mem_descr->prv_memory_pd()->desc().data.data_type); prv_src_mpd.reset(new memory::primitive_desc( - {input_tz, data_type, src_mfmt}, cpu_engine)); + {input_tz, prv_dt, src_mfmt}, cpu_engine)); + fl = mem_descr->get_fl(0); + if(fl != 0) fl = fl_min; + scale = mem_descr->get_scale(0); + if(scale != 1.) 
scale = scale_min; } + std::vector fl_bottom; + fl_bottom.push_back(fl); + std::vector scale_bottom; + scale_bottom.push_back(scale); srcs_mpd.push_back(memory::primitive_desc( - {input_tz, data_type, src_mfmt}, cpu_engine)); - - fwd_bottom_data[i].reset(new MKLDNNData( - usr_src_mpd, prv_src_mpd, bottom[i], this)); - + {input_tz, prv_dt, src_mfmt}, cpu_engine)); + + if(bottom_is_float){ + fwd_bottom_data[i].reset(new MKLDNNData( + usr_src_mpd, prv_src_mpd, bottom[i], this, true, scale_bottom)); + } else{ + fwd_bottom_data[i].reset(new MKLDNNData( + usr_src_mpd, prv_src_mpd, bottom[i], this, fl_bottom)); + } fwd_input_primitives_.push_back(fwd_bottom_data[i]->create_input(false)); fwd_input_primitives_at_.push_back(*fwd_input_primitives_[i]); } shared_ptr usr_dst_mpd(new memory::primitive_desc( - {output_tz, data_type, mfmt_nchw}, cpu_engine)); + {output_tz, usr_dt, mfmt_nchw}, cpu_engine)); concatFwd_pd.reset(new concat::primitive_desc(concat_dimension, srcs_mpd)); shared_ptr prv_dst_mpd(new memory::primitive_desc( concatFwd_pd->dst_primitive_desc())); - fwd_top_data.reset(new MKLDNNData(usr_dst_mpd, prv_dst_mpd, top[0], - this)); + std::vector fl_top; + fl_top.push_back(fl_min); + std::vector scale_top; + scale_top.push_back(scale_min); + if(bottom_is_float){ + fwd_top_data.reset(new MKLDNNData(usr_dst_mpd, prv_dst_mpd, top[0], + this, true, scale_top)); + } else{ + fwd_top_data.reset(new MKLDNNData(usr_dst_mpd, prv_dst_mpd, top[0], + this, fl_top)); + } + fwd_output_memory = fwd_top_data->create_output_memory(); concatFwd.reset(new concat(*concatFwd_pd, fwd_input_primitives_at_, *fwd_output_memory)); diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index 991b32eb7..9380afe32 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -52,7 +52,7 @@ namespace caffe { template MKLDNNConvolutionLayer::MKLDNNConvolutionLayer(const LayerParameter& param) - 
: MKLDNNLayer(), ConvolutionLayer(param) + : MKLDNNLayer(param), ConvolutionLayer(param) , fwd_bottom_data(NULL), fwd_top_data(NULL), fwd_weights_data(NULL), fwd_bias_data(NULL) , bwdd_weights_data(NULL), bwdw_bottom_data(NULL) , bwdd_bottom_diff(NULL), bwdd_top_diff(NULL) @@ -99,6 +99,7 @@ void MKLDNNConvolutionLayer::init_properties(const vector*>& this->pad_h_ = this->pad_.cpu_data()[0]; this->kernel_w_ = this->kernel_shape_.cpu_data()[1]; this->kernel_h_ = this->kernel_shape_.cpu_data()[0]; + string _conv_algorithm = this->layer_param_.convolution_param().conv_algorithm(); if(_conv_algorithm == "direct") { @@ -120,6 +121,8 @@ void MKLDNNConvolutionLayer::LayerSetUp(const vector*>& botto , const vector*>& top) { VLOG(1) << "<< MKLDNNConvolutionLayer::LayerSetUp: " << this->layer_param_.name(); + if (this->layer_param_.has_quantization_param() && this->phase_ == TEST) this->need_quantize_ = true; + ConvolutionLayer::LayerSetUp(bottom, top); init_properties(bottom, top); this->bottom_shape_ = &bottom[0]->shape(); @@ -145,7 +148,6 @@ void MKLDNNConvolutionLayer::Reshape(const vector*>& bottom this->num_ == bottom[0]->num()) ? false : true; init_properties(bottom, top); BaseConvolutionLayer::ReshapeForMKL(bottom, top); - #ifndef DISABLE_CONV_SUM_FUSION if (bottom.size() > 1) { top[0]->ShareData(*bottom[1]); @@ -185,6 +187,40 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* // ---- Initialize memory descriptors (fromat = any) to create convolution descriptor ------------- memory::data_type mpcsn = memory::data_type::f32; + memory::data_type bottom_dt = this->need_quantize_ ? 
memory::data_type::u8 : memory::data_type::f32; + memory::data_type top_dt = memory::data_type::f32; + + if (this->need_quantize_) { + if (this->bw_layer_out_ == 8) { + if (relu) { + top_dt = memory::data_type::u8; + } + else { + top_dt = memory::data_type::s8; + } + } + else { + top_dt = memory::data_type::s32; + } + } + + bool is_sum; + if (bottom.size() > 1) { + is_sum = true; + shared_ptr > bottom_0_desc = + get_mkldnn_prv_descriptor(bottom[0]); + + shared_ptr > bottom_1_desc = + get_mkldnn_prv_descriptor(bottom[1]); + + if (top_dt != bottom_1_desc->prv_memory_pd()->desc().data.data_type) { + top_dt = static_cast( + bottom_1_desc->prv_memory_pd()->desc().data.data_type); + } + } + + memory::data_type weights_dt = this->need_quantize_ ? memory::data_type::s8 : memory::data_type::f32; + memory::data_type bias_dt = this->need_quantize_ ? memory::data_type::s32 : memory::data_type::f32; memory::format mfmt_any = memory::format::any; memory::dims bottom_tz = {n, ic, ih, iw}; @@ -193,11 +229,31 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* memory::dims weights_tz = (g!= 1) ? 
memory::dims{g, oc/g, ic/g, kh, kw} : memory::dims{oc, ic, kh, kw}; // ---- Memory descriptors for initializing of convolution primitive descriptor ------------- - memory::desc init_bottom_md({bottom_tz}, mpcsn, mfmt_any); - memory::desc init_bias_md({bias_tz}, mpcsn, mfmt_any); - memory::desc init_top_md({top_tz}, mpcsn, mfmt_any); - memory::desc init_weights_md({weights_tz}, mpcsn, mfmt_any); - + memory::desc init_bottom_md({bottom_tz}, bottom_dt, mfmt_any); + memory::desc init_bias_md({bias_tz}, bias_dt, mfmt_any); + memory::desc init_top_md({top_tz}, top_dt, mfmt_any); + memory::desc init_weights_md({weights_tz}, weights_dt, mfmt_any); + + primitive_attr attr; + if (this->need_quantize_) { + if(this->scale_in_.size() > 0) this->is_float_ = true; + int mask = 0; + std::vector scales; + int count = 1; // 1 for single channel, oc for multi channel + for(int i=0; iis_float_){ + scale = this->scale_out_[0] / (this->scale_in_[0] * this->scale_params_[i]); + } else{ + int output_shift = this->fl_layer_out_[0] - this->fl_layer_in_[0] - this->fl_params_[i]; + scale = pow(2. ,output_shift); + } + scales.push_back(scale); + } + attr.set_output_scales(mask,scales); + attr.set_int_output_round_mode(round_nearest); + } + // ---- Determining engine to use ----------------------- std::string subengines = this->layer_param_.engine(); if (subengines == "" || subengines == "MKLDNN") @@ -206,7 +262,6 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* unsigned subEngineIndex = 0; mkldnn::algorithm eligibleAlgorithms[2] = {conv_algorithm, algorithm::convolution_direct}; convFwd_pd = NULL; - mkldnn::primitive_attr attr; mkldnn::post_ops ops; #ifndef DISABLE_CONV_SUM_FUSION @@ -214,13 +269,27 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* #else if(relu) { #endif - float scale = 1.0f; //for fp32, scale is 1. + float scale = 1.0f; Dtype alpha = negative_slope; // negative slope for mkldnn_eltwise_relu. float beta = 1.0f; //ignored for mkldnn_eltwise_relu. 
#ifndef DISABLE_CONV_SUM_FUSION - if (bottom.size() > 1) { - ops.append_sum(1.0f); - } + if (bottom.size() > 1) { + if (this->need_quantize_) { + float sum_scale; + if(this->is_float_){ + sum_scale = this->scale_out_[0] / + get_mkldnn_prv_descriptor(bottom[1])->get_scale(0); + } else{ + int sum_shift = + this->fl_layer_out_[0] - + get_mkldnn_prv_descriptor(bottom[1])->get_fl(0); + sum_scale = pow(2., sum_shift); + } + ops.append_sum(sum_scale); + } else { + ops.append_sum(1.0f); + } + } #endif ops.append_eltwise(scale, eltwise_relu, alpha, beta); attr.set_post_ops(ops); @@ -245,7 +314,7 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* subEngineIndex++) { try { #ifndef DISABLE_CONV_SUM_FUSION - if(relu || bottom.size() > 1) { + if(this->need_quantize_ || relu || bottom.size() > 1) { #else if(relu) { #endif @@ -275,36 +344,110 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* shared_ptr prv_fwd_top_data_memory_pd(new MemPD(convFwd_pd->dst_primitive_desc())); shared_ptr prv_fwd_weights_data_memory_pd(new MemPD(convFwd_pd->weights_primitive_desc())); + // ---- Log prv memory primitive descriptors ------------- + info_mem_pd(prv_fwd_bottom_data_memory_pd, "conv_src:" + this->layer_param_.name()); + info_mem_pd(prv_fwd_top_data_memory_pd, "conv_dst:" + this->layer_param_.name()); + // ---- Create usr memory primitive descriptors ------------- memory::format mfmt_nchw = memory::format::nchw; memory::format weights_mfmt = (g!= 1) ? 
memory::format::goihw : memory::format::oihw; // TODO: There should not be a problem to use this for Backward as well + shared_ptr usr_bottom_data_memory_pd(new MemPD({{bottom_tz}, mpcsn, mfmt_nchw}, cpu_engine)); shared_ptr usr_bias_data_memory_pd(new MemPD({{bias_tz}, mpcsn, memory::format::x}, cpu_engine)); shared_ptr usr_top_data_memory_pd(new MemPD({{top_tz}, mpcsn, mfmt_nchw}, cpu_engine)); shared_ptr usr_weights_data_memory_pd(new MemPD({{weights_tz}, mpcsn, weights_mfmt}, cpu_engine)); - // --- init primitive and prv_memory descriptors ---------------------- - fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this)); - fwd_bottom_data ->name = "fwd_bottom_data @ " + this->layer_param_.name(); + bool bottom_is_float = false; + if (const_cast(bottom[0]->prv_data()) != NULL) { + shared_ptr > blob_prv_mkldnn_mem_descr = get_mkldnn_prv_descriptor(bottom[0]); + bottom_is_float = blob_prv_mkldnn_mem_descr->get_float(); + } + if (this->need_quantize_){ + if(this->is_float_ || bottom_is_float){ + std::vector scale_bottom; + scale_bottom.push_back(this->scale_in_[0]); + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this, true, scale_bottom)); + } else{ + std::vector fl_bottom; + fl_bottom.push_back(this->fl_layer_in_[0]); + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this, fl_bottom)); + } + } else if(bottom_is_float){ + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this, false)); + } else{ + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this)); + } + fwd_bottom_data->name = "fwd_bottom_data @ " + this->layer_param_.name(); fwd_bottom_data_primitive = fwd_bottom_data->create_input(false); - fwd_top_data.reset(new MKLDNNData(usr_top_data_memory_pd, prv_fwd_top_data_memory_pd, 
top[0], this)); - fwd_top_data ->name = "fwd_top_data @ " + this->layer_param_.name(); + if (this->need_quantize_){ + if(this->is_float_ || bottom_is_float){ + std::vector scale_top; + scale_top.push_back(this->scale_out_[0]); + fwd_top_data.reset(new MKLDNNData(usr_top_data_memory_pd, prv_fwd_top_data_memory_pd, top[0], this, true, scale_top, is_sum)); + } else{ + std::vector fl_top; + fl_top.push_back(this->fl_layer_out_[0]); + fwd_top_data.reset(new MKLDNNData(usr_top_data_memory_pd, prv_fwd_top_data_memory_pd, top[0], this, fl_top, is_sum)); + } + } else if(bottom_is_float){ + fwd_top_data.reset(new MKLDNNData(usr_top_data_memory_pd, prv_fwd_top_data_memory_pd, top[0], this, false)); + } else{ + fwd_top_data.reset(new MKLDNNData(usr_top_data_memory_pd, prv_fwd_top_data_memory_pd, top[0], this)); + } + fwd_top_data->name = "fwd_top_data @ " + this->layer_param_.name(); fwd_top_data_memory = fwd_top_data->create_output_memory(); - fwd_weights_data.reset(new MKLDNNData(usr_weights_data_memory_pd, prv_fwd_weights_data_memory_pd, this->blobs_[0].get(), this)); + if (this->need_quantize_){ + int count = 1; // 1 for single channel, oc for multi channel + if(this->is_float_ || bottom_is_float){ + std::vector scale_weight; + for(int i=0; iscale_params_[i]); + } + fwd_weights_data.reset(new MKLDNNData(usr_weights_data_memory_pd, prv_fwd_weights_data_memory_pd, this->blobs_[0].get(), this, true, scale_weight)); + } else{ + std::vector fl_weight; + for(int i=0; ifl_params_[i]); + } + fwd_weights_data.reset(new MKLDNNData(usr_weights_data_memory_pd, prv_fwd_weights_data_memory_pd, this->blobs_[0].get(), this, fl_weight)); + } + } else if(bottom_is_float){ + fwd_weights_data.reset(new MKLDNNData(usr_weights_data_memory_pd, prv_fwd_weights_data_memory_pd, this->blobs_[0].get(), this, false)); + } else{ + fwd_weights_data.reset(new MKLDNNData(usr_weights_data_memory_pd, prv_fwd_weights_data_memory_pd, this->blobs_[0].get(), this)); + } fwd_weights_data->name = 
"fwd_weights_data @ " + this->layer_param_.name(); fwd_weights_data_primitive = fwd_weights_data->create_input(true); if (this->bias_term_) { shared_ptr prv_fwd_bias_data_memory_pd(new MemPD(convFwd_pd->bias_primitive_desc())); - fwd_bias_data.reset(new MKLDNNData(usr_bias_data_memory_pd, prv_fwd_bias_data_memory_pd, this->blobs_[1].get(), this)); + if (this->need_quantize_){ + int count = 1; // 1 for single channel, oc for multi channel + if(this->is_float_ || bottom_is_float){ + std::vector scale_bias; + for(int i=0; iscale_in_[0] * this->scale_params_[i]); + } + fwd_bias_data.reset(new MKLDNNData(usr_bias_data_memory_pd, prv_fwd_bias_data_memory_pd, this->blobs_[1].get(), this, true, scale_bias)); + } else{ + std::vector fl_bias; + for(int i=0; ifl_layer_in_[0] + this->fl_params_[i]); + } + fwd_bias_data.reset(new MKLDNNData(usr_bias_data_memory_pd, prv_fwd_bias_data_memory_pd, this->blobs_[1].get(), this, fl_bias)); + } + } else if(bottom_is_float){ + fwd_bias_data.reset(new MKLDNNData(usr_bias_data_memory_pd, prv_fwd_bias_data_memory_pd, this->blobs_[1].get(), this, false)); + } else{ + fwd_bias_data.reset(new MKLDNNData(usr_bias_data_memory_pd, prv_fwd_bias_data_memory_pd, this->blobs_[1].get(), this)); + } fwd_bias_data->name = "fwd_bias_data @ " + this->layer_param_.name(); fwd_bias_data_primitive = fwd_bias_data->create_input(true); - convFwd.reset(new convolution_forward(*convFwd_pd , *fwd_bottom_data_primitive, *fwd_weights_data_primitive , *fwd_bias_data_primitive, *fwd_top_data_memory)); @@ -336,6 +479,7 @@ void MKLDNNConvolutionLayer::Forward_cpu(const vector*>& bott , const vector*>& top) { VLOG(1) << "MKLDNNConvolutionLayer::Forward_cpu: " << this->layer_param_.name(); + if( convFwd_pd == NULL || this->reshape) InitConvolutionFwd(bottom, top); // making reorders if needed. 
@@ -549,7 +693,6 @@ void MKLDNNConvolutionLayer::InitConvolutionBwd(const vector* MKLDNNPrimitive bwdd_weights_data_primitive_transfer(bwdd_weights_data_primitive); bwdd_weights_data->set_mkldnn_primitive(bwdd_weights_data_primitive_transfer); - //bwdw_bottom_data->set_mkldnn_primitive(convBwdWeights); //Wrong passed primitive! (TODO: Checking!) MKLDNNPrimitive bwdw_bottom_data_primitive_transfer(bwdw_bottom_data_primitive); bwdw_bottom_data->set_mkldnn_primitive(bwdw_bottom_data_primitive_transfer); diff --git a/src/caffe/layers/mkldnn_eltwise_layer.cpp b/src/caffe/layers/mkldnn_eltwise_layer.cpp index ba47f1fa5..ec4bc08f2 100644 --- a/src/caffe/layers/mkldnn_eltwise_layer.cpp +++ b/src/caffe/layers/mkldnn_eltwise_layer.cpp @@ -147,8 +147,6 @@ void MKLDNNEltwiseLayer::InitEltwiseFwd(const vector*>& botto memory::format mfmt_nchw = memory::format::nchw; // ---- Initialize memory descriptors ------------- - shared_ptr bottom_data_md, top_data_md; - std::vector bottom_data_mpd; fwd_bottom_data.clear(); fwd_bottom_data_primitives_.clear(); @@ -168,15 +166,9 @@ void MKLDNNEltwiseLayer::InitEltwiseFwd(const vector*>& botto = get_mkldnn_prv_descriptor(bottom[i]); bottom_data_mfmt = static_cast( mem_descr->prv_memory_pd()->desc().data.format); - bottom_data_md.reset(new memory::desc(mem_descr->prv_memory_pd()->desc())); prv_bottom_data_mpd.reset(new memory::primitive_desc( {{n, ic, ih, iw}, mpcsn, bottom_data_mfmt}, cpu_engine)); } - else - { - bottom_data_md.reset(new memory::desc({{n, ic, ih, iw}}, mpcsn, bottom_data_mfmt)); - } - top_data_md = bottom_data_md; bottom_data_mpd.push_back(memory::primitive_desc( {{n, ic, ih, iw}, mpcsn, bottom_data_mfmt}, cpu_engine)); diff --git a/src/caffe/layers/mkldnn_inner_product_layer.cpp b/src/caffe/layers/mkldnn_inner_product_layer.cpp index 7c48547b6..9994df789 100644 --- a/src/caffe/layers/mkldnn_inner_product_layer.cpp +++ b/src/caffe/layers/mkldnn_inner_product_layer.cpp @@ -56,7 +56,7 @@ namespace caffe { template 
MKLDNNInnerProductLayer::MKLDNNInnerProductLayer( const LayerParameter& param) : - MKLDNNLayer(), + MKLDNNLayer(param), InnerProductLayer(param), fwd_bottom_data(NULL), fwd_top_data(NULL), diff --git a/src/caffe/layers/mkldnn_lrn_layer.cpp b/src/caffe/layers/mkldnn_lrn_layer.cpp index 41c0f45b6..d3c3147fd 100644 --- a/src/caffe/layers/mkldnn_lrn_layer.cpp +++ b/src/caffe/layers/mkldnn_lrn_layer.cpp @@ -46,7 +46,7 @@ namespace caffe { template MKLDNNLRNLayer::MKLDNNLRNLayer(const LayerParameter& param) - : MKLDNNLayer(), Layer(param) + : MKLDNNLayer(param), Layer(param) , fwd_top_data(NULL), fwd_bottom_data(NULL) , bwd_top_diff(NULL), bwd_bottom_diff(NULL) , lrnFwd_pd(NULL), lrnBwd_pd(NULL) @@ -140,21 +140,24 @@ void MKLDNNLRNLayer::InitLRNFwd(const vector*>& bottom, const engine cpu_engine = CpuEngine::Instance().get_engine(); memory::data_type mpcsn = memory::data_type::f32; - // ---- Initialize memory descriptors ------------- memory::dims tz = {n, ic, ih, iw}; - shared_ptr top_md; - shared_ptr usr_mpd, prv_mpd; + memory::format mfmt_nchw = memory::format::nchw; + memory::format cmfmt = mfmt_nchw; + + // ---- Initialize memory descriptors ------------- + typedef typename memory::primitive_desc MemPD; // short name for memory::primitive_desc + + // ---- Create usr memory primitive descriptors ------------- + shared_ptr usr_data_memory_pd(new MemPD({{tz}, mpcsn, mfmt_nchw}, cpu_engine)); + + // ---- Create prv memory descriptors ------------------- if (bottom_data_is_prv) { shared_ptr > mem_descr = get_mkldnn_prv_descriptor(bottom[0]); - bottom_md.reset(new memory::desc(mem_descr->prv_memory_pd()->desc())); - usr_mpd = mem_descr->usr_memory_pd(); - prv_mpd = mem_descr->prv_memory_pd(); - } else { - bottom_md.reset(new memory::desc({tz}, mpcsn, memory::format::nchw)); - usr_mpd.reset(new memory::primitive_desc(*bottom_md, cpu_engine)); + cmfmt = static_cast(mem_descr->prv_memory_pd()->desc().data.format); } - top_md = bottom_md; + + bottom_md.reset(new 
memory::desc({tz}, mpcsn, cmfmt)); // ---- Initialize LRN primitive descriptor ------------- lrn_forward::desc lrnFwd_desc(propagation, lrn_algorithm, *bottom_md, @@ -179,20 +182,15 @@ void MKLDNNLRNLayer::InitLRNFwd(const vector*>& bottom, const CHECK(lrnFwd_pd); // ---- Create priv memory primitive descriptors stored as class members ------------- - typedef typename memory::primitive_desc MemPD; // short name for memory::primitive_desc shared_ptr prv_fwd_bottom_data_memory_pd(new MemPD(lrnFwd_pd->src_primitive_desc())); shared_ptr prv_fwd_top_data_memory_pd(new MemPD(lrnFwd_pd->dst_primitive_desc())); - - // ---- Create usr memory primitive descriptors ------------- - memory::format mfmt_nchw = memory::format::nchw; - - shared_ptr usr_data_memory_pd(new MemPD({{tz}, mpcsn, mfmt_nchw}, cpu_engine)); + shared_ptr prv_memory_pd(new MemPD(lrnFwd_pd->dst_primitive_desc())); // --- init primitive and prv_memory descriptors ---------------------- fwd_bottom_data.reset(new MKLDNNData(usr_data_memory_pd, prv_fwd_bottom_data_memory_pd, bottom[0], this)); fwd_bottom_data->name = "fwd_bottom_data @ " + this->layer_param_.name(); fwd_bottom_data_primitive = fwd_bottom_data->create_input(false); - fwd_top_data.reset(new MKLDNNData(usr_mpd, prv_fwd_top_data_memory_pd, top[0], this)); + fwd_top_data.reset(new MKLDNNData(usr_data_memory_pd, prv_fwd_top_data_memory_pd, top[0], this)); fwd_top_data->name = "fwd_top_data @ " + this->layer_param_.name(); fwd_top_data_memory = fwd_top_data->create_output_memory(); @@ -220,6 +218,7 @@ void MKLDNNLRNLayer::Forward_cpu(const vector*>& bottom VLOG(1) << "MKLDNNLRNLayer::Forward_cpu: " << this->layer_param_.name(); if( lrnFwd_pd == NULL || this->reshape) InitLRNFwd(bottom, top); + // making reorders if needed. 
fwd_bottom_data->sync_before_read(); // update top that head at prv diff --git a/src/caffe/layers/mkldnn_pooling_layer.cpp b/src/caffe/layers/mkldnn_pooling_layer.cpp index 239ee66af..c672dd889 100644 --- a/src/caffe/layers/mkldnn_pooling_layer.cpp +++ b/src/caffe/layers/mkldnn_pooling_layer.cpp @@ -276,12 +276,19 @@ void MKLDNNPoolingLayer::InitPoolingFwd(const vector*>& botto shared_ptr usr_bottom_data_mpd(new MemPD({{bottom_tz}, mpcsn, mfmt_nchw}, cpu_engine)); shared_ptr usr_top_data_mpd(new MemPD({{top_tz}, mpcsn, mfmt_nchw}, cpu_engine)); + std::vector fl; + std::vector scale; + bool bottom_is_float = false; if (bottom_data_is_prv) { shared_ptr > mem_descr = get_mkldnn_prv_descriptor(bottom[0]); + bottom_is_float = mem_descr->get_float(); cmfmt = static_cast(mem_descr->prv_memory_pd()->desc().data.format); mpcsn = static_cast(mem_descr->prv_memory_pd()->desc().data.data_type); + fl.push_back(mem_descr->get_fl(0)); + scale.push_back(mem_descr->get_scale(0)); } + shared_ptr init_fwd_bottom_md(new memory::desc({bottom_tz}, mpcsn, cmfmt)); shared_ptr init_fwd_top_md(new memory::desc({top_tz}, mpcsn, cmfmt)); @@ -315,9 +322,12 @@ void MKLDNNPoolingLayer::InitPoolingFwd(const vector*>& botto if (bottom_data_is_prv) { prv_fwd_bottom_data_mpd.reset(new MemPD(*init_fwd_bottom_md, engine)); prv_fwd_top_data_mpd.reset(new MemPD(*init_fwd_top_md, engine)); + // ---- Log prv memory primitive descriptors ------------- + info_mem_pd(prv_fwd_bottom_data_mpd, "pooling_src:" + this->layer_param_.name()); + info_mem_pd(prv_fwd_top_data_mpd, "pooling_dst:" + this->layer_param_.name()); } - // ---- Create prv memory --------------------- + // ---- Create priv memory --------------------- // We'll output the mask to top[1] if it's of size >1. 
uint32_t* mask = NULL; // suppress warnings about uninitalized variables @@ -327,10 +337,18 @@ void MKLDNNPoolingLayer::InitPoolingFwd(const vector*>& botto : max_idx_.mutable_cpu_data(); // --- init primitive and prv_memory descriptors ---------------------- - fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_mpd, prv_fwd_bottom_data_mpd, bottom[0], this)); + if(bottom_is_float){ + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_mpd, prv_fwd_bottom_data_mpd, bottom[0], this, true, scale)); + } else { + fwd_bottom_data.reset(new MKLDNNData(usr_bottom_data_mpd, prv_fwd_bottom_data_mpd, bottom[0], this, fl)); + } fwd_bottom_data_primitive = fwd_bottom_data->create_input(false); - fwd_top_data.reset(new MKLDNNData(usr_top_data_mpd, prv_fwd_top_data_mpd, top[0], this)); + if(bottom_is_float){ + fwd_top_data.reset(new MKLDNNData(usr_top_data_mpd, prv_fwd_top_data_mpd, top[0], this, true, scale)); + } else{ + fwd_top_data.reset(new MKLDNNData(usr_top_data_mpd, prv_fwd_top_data_mpd, top[0], this, fl)); + } fwd_top_data_memory = fwd_top_data->create_output_memory(); if (propagation == prop_kind::forward_training && diff --git a/src/caffe/mkldnn_base.cpp b/src/caffe/mkldnn_base.cpp index 7f07478ba..a20c5b8ae 100644 --- a/src/caffe/mkldnn_base.cpp +++ b/src/caffe/mkldnn_base.cpp @@ -66,6 +66,39 @@ shared_ptr MKLDNNPrimitive::submit() { return mkldnn_stream; } +template +MKLDNNLayer::MKLDNNLayer(const LayerParameter ¶m) : + BaseQuantLayer() { + if (param.has_quantization_param()) { + this->precision_ = param.quantization_param().precision(); + this->rounding_ = param.quantization_param().rounding_scheme(); + switch (this->precision_) { + case QuantizationParameter_Precision_DYNAMIC_FIXED_POINT: + this->bw_layer_in_ = param.quantization_param().bw_layer_in(); + this->bw_layer_out_ = param.quantization_param().bw_layer_out(); + this->bw_params_ = param.quantization_param().bw_params(); + for (int i = 0; i < param.quantization_param().fl_layer_in_size(); i++) + 
this->fl_layer_in_.push_back(param.quantization_param().fl_layer_in(i)); + for (int i = 0; i < param.quantization_param().fl_layer_out_size(); i++) + this->fl_layer_out_.push_back(param.quantization_param().fl_layer_out(i)); + for (int i = 0; i < param.quantization_param().fl_params_size(); i++) + this->fl_params_.push_back(param.quantization_param().fl_params(i)); + //floating point + for (int i = 0; i < param.quantization_param().scale_in_size(); i++) + this->scale_in_.push_back(param.quantization_param().scale_in(i)); + for (int i = 0; i < param.quantization_param().scale_out_size(); i++) + this->scale_out_.push_back(param.quantization_param().scale_out(i)); + for (int i = 0; i < param.quantization_param().scale_params_size(); i++) + this->scale_params_.push_back(param.quantization_param().scale_params(i)); + + break; + default: + LOG(FATAL) << "Unknown precision mode: " << this->precision_; + break; + } + } +} + template class MKLDNNLayer; template class MKLDNNLayer; template class MKLDNNPrimitive; diff --git a/src/caffe/mkldnn_memory.cpp b/src/caffe/mkldnn_memory.cpp index 9601e41ee..d2c170ee4 100644 --- a/src/caffe/mkldnn_memory.cpp +++ b/src/caffe/mkldnn_memory.cpp @@ -46,15 +46,42 @@ template MKLDNNMemoryDescriptorBase::MKLDNNMemoryDescriptorBase(shared_ptr usr_memory_pd , shared_ptr prv_memory_pd , Blob* blob - , MKLDNNLayer* mkldnn_layer) + , MKLDNNLayer* mkldnn_layer + , bool is_float + , std::vector scale + , bool is_sum) : name("MKLDNNMemoryDescriptorBase") , _reorder_usr2prv_pd(), _reorder_prv2usr_pd(), _reorder_extprv2prv_pd() ,_prv_memory(), _internal_ptr(NULL), _usr_memory(), _cpu_ptr(NULL) , _mkldnn_layer(NULL) { - set_usr_memory_pd(usr_memory_pd); - set_prv_memory_pd(prv_memory_pd); + set_usr_memory_pd(usr_memory_pd, scale); + set_prv_memory_pd(prv_memory_pd, scale); set_mkldnn_layer(mkldnn_layer); + this->set_scale(scale); + this->set_sum(is_sum); + this->set_float(is_float); + this->_blob = blob; +} + +template 
+MKLDNNMemoryDescriptorBase::MKLDNNMemoryDescriptorBase(shared_ptr usr_memory_pd + , shared_ptr prv_memory_pd + , Blob* blob + , MKLDNNLayer* mkldnn_layer + , std::vector fl + , bool is_sum) + : name("MKLDNNMemoryDescriptorBase") + , _reorder_usr2prv_pd(), _reorder_prv2usr_pd(), _reorder_extprv2prv_pd() + ,_prv_memory(), _internal_ptr(NULL), _usr_memory(), _cpu_ptr(NULL) + , _mkldnn_layer(NULL) +{ + set_usr_memory_pd(usr_memory_pd, fl); + set_prv_memory_pd(prv_memory_pd, fl); + set_mkldnn_layer(mkldnn_layer); + this->set_fl(fl); + this->set_sum(is_sum); + this->set_float(false); this->_blob = blob; } @@ -74,29 +101,112 @@ void MKLDNNMemoryDescriptorBase::check_usr_with_prv_descriptors() } template -void MKLDNNMemoryDescriptorBase::create_reorder_descriptors() +void MKLDNNMemoryDescriptorBase::create_reorder_descriptors(std::vector scale, std::vector scale_ext, bool is_sum) { CHECK(_usr_memory_pd); CHECK(_prv_memory_pd); + + primitive_attr attri; + int mask = 0; + if ( *_usr_memory_pd != *_prv_memory_pd) { + std::vector scales_u2p; + for(int i=0; i( - new reorder::primitive_desc(*_usr_memory_pd, *_prv_memory_pd)); + new reorder::primitive_desc(*_usr_memory_pd, *_prv_memory_pd, attri)); + std::vector scales_p2u; + for(int i=0; i( - new reorder::primitive_desc(*_prv_memory_pd, *_usr_memory_pd)); + new reorder::primitive_desc(*_prv_memory_pd, *_usr_memory_pd, attri)); } - if ( _extprv_memory_pd && *_prv_memory_pd != *_extprv_memory_pd) { - _reorder_extprv2prv_pd = shared_ptr( - new reorder::primitive_desc(*_extprv_memory_pd, *_prv_memory_pd)); + if ( _extprv_memory_pd && (*_prv_memory_pd != *_extprv_memory_pd || scale != scale_ext)) { + if(is_sum == true && scale == scale_ext && _extprv_memory_pd->desc().data.data_type == memory::data_type::s8 && _prv_memory_pd->desc().data.data_type == memory::data_type::u8){ +#ifdef DEBUG + LOG(INFO) << "skip s8 to u8 reorder...."; +#endif + _reorder_extprv2prv_pd = NULL; + }else{ + std::vector scales_e2p; + for(int i=0; iint8 
blob_prv_mkldnn_mem_descr->get_scale() will always be 0 ? + scales_e2p.push_back(shift_scale); + } + attri.set_output_scales(mask, scales_e2p); + attri.set_int_output_round_mode(round_nearest); + _reorder_extprv2prv_pd = shared_ptr(new reorder::primitive_desc(*_extprv_memory_pd, *_prv_memory_pd, attri)); + + } } } +template +void MKLDNNMemoryDescriptorBase::create_reorder_descriptors(std::vector fl, std::vector fl_ext, bool is_sum) +{ + CHECK(_usr_memory_pd); + CHECK(_prv_memory_pd); + + primitive_attr attri; + int mask = 0; + + if ( *_usr_memory_pd != *_prv_memory_pd) { + std::vector scales_u2p; + for(int i=0; i( + new reorder::primitive_desc(*_usr_memory_pd, *_prv_memory_pd, attri)); + + std::vector scales_p2u; + for(int i=0; i( + new reorder::primitive_desc(*_prv_memory_pd, *_usr_memory_pd, attri)); + } + if ( _extprv_memory_pd && (*_prv_memory_pd != *_extprv_memory_pd || fl != fl_ext)) { + if(is_sum == true && fl == fl_ext && _extprv_memory_pd->desc().data.data_type == memory::data_type::s8 && _prv_memory_pd->desc().data.data_type == memory::data_type::u8){ +#ifdef DEBUG + LOG(INFO) << "skip s8 to u8 reorder...."; +#endif + _reorder_extprv2prv_pd = NULL; + }else{ + std::vector scales_e2p; + for(int i=0; iint8 blob_prv_mkldnn_mem_descr->get_fl() will always be 0 ? 
+ float scale = pow(2, shift_fl); + scales_e2p.push_back(scale); + } + attri.set_output_scales(mask, scales_e2p); + attri.set_int_output_round_mode(round_nearest); + _reorder_extprv2prv_pd = shared_ptr(new reorder::primitive_desc(*_extprv_memory_pd, *_prv_memory_pd, attri)); + + } + } +} template MKLDNNMemoryDescriptor::MKLDNNMemoryDescriptor(shared_ptr usr_memory_pd , shared_ptr prv_memory_pd - , Blob* blob, MKLDNNLayer* mkldnn_layer) - : MKLDNNMemoryDescriptorBase(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer) + , Blob* blob, MKLDNNLayer* mkldnn_layer + , bool is_float + , std::vector scale + , bool is_sum) + : MKLDNNMemoryDescriptorBase(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer, is_float, scale, is_sum) { const Dtype* prv_ptr = is_diff ? blob->prv_diff() : blob->prv_data(); @@ -106,11 +216,36 @@ template LOG(INFO) << "Format of blob-prv-memory-pd: " << blob_prv_mkldnn_mem_descr->prv_memory_pd()->desc().data.format; LOG(INFO) << "Format of this-prv-memory-pd: " << this->prv_memory_pd()->desc().data.format; #endif - if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd()) { + if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || blob_prv_mkldnn_mem_descr->get_scale() != this->get_scale()) { #ifdef DEBUG LOG(INFO) << "Formats of blob-prv-memory-pd and this-prv-memory-pd are not equal !"; #endif - this->set_extprv_memory_pd(blob_prv_mkldnn_mem_descr->prv_memory_pd()); + this->set_extprv_memory_pd(blob_prv_mkldnn_mem_descr->prv_memory_pd(), scale, blob_prv_mkldnn_mem_descr->get_scale(), blob_prv_mkldnn_mem_descr->get_sum()); + } + } +} + +template + MKLDNNMemoryDescriptor::MKLDNNMemoryDescriptor(shared_ptr usr_memory_pd + , shared_ptr prv_memory_pd + , Blob* blob, MKLDNNLayer* mkldnn_layer + , std::vector fl + , bool is_sum) + : MKLDNNMemoryDescriptorBase(usr_memory_pd, prv_memory_pd, blob, mkldnn_layer, fl, is_sum) +{ + const Dtype* prv_ptr = is_diff ? 
blob->prv_diff() : blob->prv_data(); + + if (prv_ptr != NULL) { + shared_ptr > blob_prv_mkldnn_mem_descr = get_mkldnn_prv_descriptor(blob); +#ifdef DEBUG + LOG(INFO) << "Format of blob-prv-memory-pd: " << blob_prv_mkldnn_mem_descr->prv_memory_pd()->desc().data.format; + LOG(INFO) << "Format of this-prv-memory-pd: " << this->prv_memory_pd()->desc().data.format; +#endif + if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || blob_prv_mkldnn_mem_descr->get_fl() != this->get_fl()) { +#ifdef DEBUG + LOG(INFO) << "Formats of blob-prv-memory-pd and this-prv-memory-pd are not equal !"; +#endif + this->set_extprv_memory_pd(blob_prv_mkldnn_mem_descr->prv_memory_pd(), fl, blob_prv_mkldnn_mem_descr->get_fl(), blob_prv_mkldnn_mem_descr->get_sum()); } } } @@ -141,8 +276,8 @@ void MKLDNNMemoryDescriptor::convert_to_prv(void* cpu_ptr) VLOG(1) << "--- MKLDNNMemoryDescriptorBase::convert_to_prv --- " << this->name; #ifdef DEBUG LOG(INFO) << "Reorder: from usr to prv."; - LOG(INFO) << "Format of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.format; - LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format; + LOG(INFO) << "Format of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.format << " Data_type of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.data_type; + LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format << " Data_type of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.data_type; #endif PERFORMANCE_MEASUREMENT_BEGIN(); this->_reorder_usr2prv.submit(); @@ -180,6 +315,8 @@ void MKLDNNMemoryDescriptor::convert_from_prv(void* cpu_ptr) LOG(INFO) << "Reorder: from prv to usr."; LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format; LOG(INFO) << "Format of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.format; + LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format << " Data_type of 
_prv_memory_pd: " << this->_prv_memory_pd->desc().data.data_type; + LOG(INFO) << "Format of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.format << " Data_type of _usr_memory_pd: " << this->_usr_memory_pd->desc().data.data_type; #endif PERFORMANCE_MEASUREMENT_BEGIN(); this->_reorder_prv2usr.submit(); @@ -206,19 +343,19 @@ void MKLDNNMemoryDescriptor::convert_from_extprv(shared_ptr_reorder_extprv2prv_pd == NULL) return; - if (*this->_extprv_memory_pd == *this->_prv_memory_pd) - { -#ifdef DEBUG - LOG(INFO) << "The format and data_type of _extprv_memory_pd and _prv_memory_pd is same, no need do conversion."; -#endif - return; - } +// if (*this->_extprv_memory_pd == *this->_prv_memory_pd) +// { +//#ifdef DEBUG +// LOG(INFO) << "The format and data_type of _extprv_memory_pd and _prv_memory_pd is same, no need do conversion."; +//#endif +// return; +// } create_reorder_from_extprv(aprimitive); VLOG(1) << "--- MKLDNNMemoryDescriptorBase::convert_from_extprv --- " << this->name; #ifdef DEBUG LOG(INFO) << "Reorder: from extprv to prv."; - LOG(INFO) << "Format of _extprv_memory_pd: " << this->_extprv_memory_pd->desc().data.format; - LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format; + LOG(INFO) << "Format of _extprv_memory_pd: " << this->_extprv_memory_pd->desc().data.format << " Data_type of _extprv_memory_pd: " << this->_extprv_memory_pd->desc().data.data_type; + LOG(INFO) << "Format of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.format<< " Data_type of _prv_memory_pd: " << this->_prv_memory_pd->desc().data.data_type; #endif PERFORMANCE_MEASUREMENT_BEGIN(); this->_reorder_extprv2prv.submit(); @@ -260,6 +397,10 @@ shared_ptr MKLDNNMemoryDescriptor::get_blob_prv_primi ,bool set_prv_ptr, bool convert ,MKLDNNMemoryDescriptor* converted_in_fwd) { +#ifdef DEBUG + LOG(INFO) << "GET_BLOB_PRV_PRIMITIVE"; +#endif + if (!this->conversion_needed()) { return shared_ptr(); // TODO: may be CHECK ? 
} @@ -271,10 +412,12 @@ shared_ptr MKLDNNMemoryDescriptor::get_blob_prv_primi // TODO: use previously done conversion on forward - needed for training NOT_IMPLEMENTED; } - if(convert) + if(convert) { this->convert_to_prv(const_cast(is_diff ? blob->cpu_diff() : blob->cpu_data())); - else + } + else { this->create_reorder_to_prv(const_cast(is_diff ? blob->cpu_diff() : blob->cpu_data())); + } if (set_prv_ptr) { if (is_diff) { blob->set_prv_diff_descriptor(this->get_shared_ptr(), false); @@ -291,17 +434,35 @@ shared_ptr MKLDNNMemoryDescriptor::get_blob_prv_primi return this->reorder_usr2prv(); } else { shared_ptr > blob_prv_mkldnn_mem_descr = get_mkldnn_prv_descriptor(blob); - - if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd()) { - // prv in blob and in this descrptor may have different layouts - if(convert) - this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); - else - this->create_reorder_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); - return this->reorder_extprv2prv(); - } else if (blob_prv_mkldnn_mem_descr.get() != this) { - VLOG(1) << "layout OK " << blob_prv_mkldnn_mem_descr->name << " == " << this->name; - } + if(blob_prv_mkldnn_mem_descr->get_float() || this->get_float()){ + if ((*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || blob_prv_mkldnn_mem_descr->get_scale() != this->get_scale()) && this->_reorder_extprv2prv_pd != NULL) { + // prv in blob and in this descrptor may have different layouts + if(convert) { + LOG(INFO) << "BAD CONVERT"; + this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); + } + else { + this->create_reorder_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); + } + return this->reorder_extprv2prv(); + } else if (blob_prv_mkldnn_mem_descr.get() != this) { + VLOG(1) << "layout OK " << blob_prv_mkldnn_mem_descr->name << " == " << this->name; + } + } else{ + if ((*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || 
blob_prv_mkldnn_mem_descr->get_fl() != this->get_fl()) && this->_reorder_extprv2prv_pd != NULL) { + // prv in blob and in this descrptor may have different layouts + if(convert) { + LOG(INFO) << "BAD CONVERT"; + this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); + } + else { + this->create_reorder_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); + } + return this->reorder_extprv2prv(); + } else if (blob_prv_mkldnn_mem_descr.get() != this) { + VLOG(1) << "layout OK " << blob_prv_mkldnn_mem_descr->name << " == " << this->name; + } + } return blob_prv_mkldnn_mem_descr->aprimitive(); } NOT_IMPLEMENTED; @@ -312,6 +473,10 @@ shared_ptr MKLDNNMemoryDescriptor::get_blob_prv_primi template void MKLDNNMemoryDescriptor::sync_before_read() { +#ifdef DEBUG + LOG(INFO) << "SYNC_BEFORE_READ"; +#endif + // TODO: need to optimize code if (!this->conversion_needed()) { return; @@ -344,14 +509,33 @@ void MKLDNNMemoryDescriptor::sync_before_read() } else { shared_ptr > blob_prv_mkldnn_mem_descr = get_mkldnn_prv_descriptor(this->_blob); - if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd()) { - // prv in blob and in this descrptor may have different layouts - this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); - } else { - if (is_diff) { - this->_blob->mutable_prv_diff(); + if(blob_prv_mkldnn_mem_descr->get_float() || this->get_float()){ + if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || blob_prv_mkldnn_mem_descr->get_scale() != this->get_scale()) { + // prv in blob and in this descrptor may have different layouts +#ifdef DEBUG + LOG(INFO) << "Convert from extprv"; +#endif + this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); + } else { + if (is_diff) { + this->_blob->mutable_prv_diff(); + } else { + this->_blob->mutable_prv_data(); + } + } + } else{ + if (*blob_prv_mkldnn_mem_descr->prv_memory_pd() != *this->prv_memory_pd() || blob_prv_mkldnn_mem_descr->get_fl() != this->get_fl()) { 
+ // prv in blob and in this descrptor may have different layouts +#ifdef DEBUG + LOG(INFO) << "Convert from extprv"; +#endif + this->convert_from_extprv(blob_prv_mkldnn_mem_descr->aprimitive()); } else { - this->_blob->mutable_prv_data(); + if (is_diff) { + this->_blob->mutable_prv_diff(); + } else { + this->_blob->mutable_prv_data(); + } } } } diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 2118394ec..646b66b8d 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -1109,6 +1109,106 @@ bool Net::StateMeetsRule(const NetState& state, return true; } +template +vector Net::FindMax(Blob* blob, bool is_single) { + const Dtype* data = blob->cpu_data(); + int cnt = blob->count(); + vector max_vals; + Dtype max_val = (Dtype)(-10); + + int index = 0; + if(blob->shape().size() == 4) { + if(is_single) { + max_vals = vector(1, Dtype(-10)); + for (int i = 0; i < cnt; ++i) { + max_val = std::max(max_val, (Dtype)fabs(data[i])); + } + max_vals.at(0) = max_val; + } else { // output_channel * input_channel * kernel_height * kernel_width + int height = blob->shape(2); + int width = blob->shape(3); + int channel = blob->shape(0); + max_vals = vector(channel, Dtype(-10)); + int step = blob->shape(1) * height * width; + for (int i = 0; i < cnt; ++i) { + if((i + 1) % step == 0) { + max_vals.at(index) = std::max(max_val, (Dtype)fabs(data[i])); + ++index; + } else { + max_val = std::max(max_val, (Dtype)fabs(data[i])); + } + } + } + } else { + if(is_single) { + max_vals = vector(1, Dtype(-10)); + for (int i = 0; i < cnt; ++i) { + max_val = std::max(max_val, (Dtype)fabs(data[i])); + } + max_vals.at(0) = max_val; + } else { // output_channel * input_channel + int channel = blob->shape(0); + max_vals = vector(channel, Dtype(-10)); + int step = blob->shape(1); + for (int i = 0; i < cnt; ++i) { + if((i + 1) % step == 0) { + max_vals.at(index) = std::max(max_val, (Dtype)fabs(data[i])); + ++index; + } else { + max_val = std::max(max_val, (Dtype)fabs(data[i])); + } + } + } + } + + 
return max_vals; +} + +template +void Net::RangeInLayers(vector* layer_name, + vector* max_in, vector* max_out, vector>* max_param, string scaling) { + // Initialize vector elements, if needed. + if(layer_name->size()==0) { + for (int layer_id = 0; layer_id < layers_.size(); ++layer_id) { + if (strcmp(layers_[layer_id]->type(), "Convolution") == 0) { + layer_name->push_back(this->layer_names()[layer_id]); + max_in->push_back(0); + max_out->push_back(0); + if (scaling == "single") { + max_param->push_back(vector(1, 0)); + } + else { + int param_shape = (&(*layers_[layer_id]->blobs()[0]))->shape(0); + max_param->push_back(vector(param_shape, 0)); + } + } + } + } + // Find maximal values. + int index = 0; + vector max_vals; + for (int layer_id = 0; layer_id < layers_.size(); ++layer_id) { + if (strcmp(layers_[layer_id]->type(), "Convolution") == 0) { + max_vals = FindMax(bottom_vecs_[layer_id][0]); + max_in->at(index) = std::max(max_in->at(index), max_vals.at(0)); + + max_vals = FindMax(top_vecs_[layer_id][0]); + max_out->at(index) = std::max(max_out->at(index), max_vals.at(0)); + + // Consider the weights only, ignore the bias + if (scaling == "single") { + max_vals = FindMax(&(*layers_[layer_id]->blobs()[0])); + max_param->at(index).at(0) = std::max(max_param->at(index).at(0), max_vals.at(0)); + } else { + max_vals = FindMax(&(*layers_[layer_id]->blobs()[0]), false); + for(int i = 0; i < max_vals.size(); ++i) + max_param->at(index).at(i) = std::max(max_param->at(index).at(i), max_vals.at(i)); + } + index++; + } + } +} + // Helper for Net::Init: add a new top blob to the net. 
template void Net::AppendTop(const NetParameter& param, const int layer_id, @@ -1281,7 +1381,6 @@ Dtype Net::ForwardFromTo(int start, int end) { LAYER_TIMING_START(forward, i); PERFORMANCE_MEASUREMENT_BEGIN(); - // LOG(ERROR) << "Forwarding " << layer_names_[i]; Dtype layer_loss = layers_[i]->Forward(bottom_vecs_[i], top_vecs_[i]); PERFORMANCE_MEASUREMENT_END((std::string("FW_") + layer_names_[i]).c_str()); diff --git a/src/caffe/proto/caffe.proto b/src/caffe/proto/caffe.proto index 439415c26..cfbfdb55c 100755 --- a/src/caffe/proto/caffe.proto +++ b/src/caffe/proto/caffe.proto @@ -609,6 +609,7 @@ message LayerParameter { optional MultinodeLayerParameter multinode = 150; optional MnActivationParameter mn_activation_param = 151; optional MnParamGradCompressParameter mn_grad_compress_param = 156; + optional QuantizationParameter quantization_param = 158; } message MultinodeLayerParameter { @@ -630,7 +631,27 @@ message MnActivationParameter { optional bool need_reduce = 5 [default = true]; } - +// Message for layers with reduced word with arithmetic +message QuantizationParameter{ + enum Precision { + DYNAMIC_FIXED_POINT = 0; + } + optional Precision precision = 1 [default = DYNAMIC_FIXED_POINT]; + enum Rounding { + NEAREST = 0; + } + optional Rounding rounding_scheme = 2 [default = NEAREST]; + // Dynamic fixed point word width + optional uint32 bw_layer_in = 3 [default = 32]; + optional uint32 bw_layer_out = 4 [default = 32]; + optional uint32 bw_params = 5 [default = 32]; + repeated int32 fl_layer_in = 6; + repeated int32 fl_layer_out = 7; + repeated int32 fl_params = 8; + repeated float scale_in = 20; + repeated float scale_out = 21; + repeated float scale_params = 22; +} message MnParamGradCompressParameter { repeated bool param_grad_compress_enable = 1; diff --git a/src/caffe/quant/layers/base_quant_layer.cpp b/src/caffe/quant/layers/base_quant_layer.cpp new file mode 100644 index 000000000..1055adc47 --- /dev/null +++ b/src/caffe/quant/layers/base_quant_layer.cpp 
@@ -0,0 +1,56 @@ +/* +All modification made by Intel Corporation: © 2016 Intel Corporation + +All contributions by the University of California: +Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +All rights reserved. + +All other contributions: +Copyright (c) 2014, 2015, the respective contributors +All rights reserved. +For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md + +A part of the code referenced BVLC CAFFE ristretto branch +For the original code go to https://github.com/pmgysel/caffe + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + * Neither the name of Intel Corporation nor the names of its contributors + may be used to endorse or promote products derived from this software + without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. 
IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ + +#include +#include +#include +#include + +#include "caffe/mkldnn_memory.hpp" +#include "caffe/quant/base_quant_layer.hpp" + +namespace caffe { + +template +BaseQuantLayer::BaseQuantLayer() : need_quantize_(false), is_float_(false) { +} + +INSTANTIATE_CLASS(BaseQuantLayer); + +} // namespace caffe diff --git a/src/caffe/quant/quantization.cpp b/src/caffe/quant/quantization.cpp new file mode 100644 index 000000000..ae312869b --- /dev/null +++ b/src/caffe/quant/quantization.cpp @@ -0,0 +1,331 @@ +/* +All modification made by Intel Corporation: © 2016 Intel Corporation + +All contributions by the University of California: +Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +All rights reserved. + +All other contributions: +Copyright (c) 2014, 2015, the respective contributors +All rights reserved. +For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md + +A part of the code referenced BVLC CAFFE ristretto branch +For the original code go to https://github.com/pmgysel/caffe + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. 
+ * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + * Neither the name of Intel Corporation nor the names of its contributors + may be used to endorse or promote products derived from this software + without specific prior written permission. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+*/ + +#include "boost/algorithm/string.hpp" + +#include "caffe/caffe.hpp" +#include "caffe/net.hpp" +#include "caffe/quant/quantization.hpp" + +using caffe::Caffe; +using caffe::Net; +using caffe::string; +using caffe::vector; +using caffe::Blob; +using caffe::LayerParameter; +using caffe::NetParameter; + +Quantization::Quantization(string model, string weights, string model_quantized, + int iterations, string trimming_mode, double error_margin, int score_number, string scaling, int detection, int power) { + this->model_ = model; + this->weights_ = weights; + this->model_quantized_ = model_quantized; + this->iterations_ = iterations; + this->trimming_mode_ = trimming_mode; + this->error_margin_ = error_margin; + this->score_number = score_number; + this->scaling = scaling; + this->detection = detection; + this->power = power; +} + +void Quantization::QuantizeNet() { + CheckWritePermissions(model_quantized_); + + float accuracy; + Net* net_test = new Net(model_, caffe::TEST); + net_test->CopyTrainedLayersFrom(weights_); + RunForwardBatches(this->iterations_, net_test, &accuracy, true, this->score_number); // RangeInLayer during sampling + delete net_test; + + // Do network quantization and scoring. 
+ if (trimming_mode_ == "dynamic_fixed_point") { + Quantize2DynamicFixedPoint(); + } else { + LOG(FATAL) << "Unknown trimming mode: " << trimming_mode_; + } +} + +void Quantization::CheckWritePermissions(const string path) { + std::ofstream probe_ofs(path.c_str()); + if (probe_ofs.good()) { + probe_ofs.close(); + std::remove(path.c_str()); + } else { + LOG(FATAL) << "Missing write permissions"; + } +} + +void Quantization::RunForwardBatches(const int iterations, + Net* caffe_net, float* accuracy, const bool do_stats, + const int score_number) { + LOG(INFO) << "Running for " << iterations << " iterations."; + vector* > bottom_vec; + vector test_score_output_id; + vector test_score; + float loss = 0; + for (int i = 0; i < iterations; ++i) { + float iter_loss; + // Do forward propagation. + const vector*>& result = + caffe_net->Forward(bottom_vec, &iter_loss); + // Find maximal values in network. + if(do_stats) { + caffe_net->RangeInLayers(&layer_names_, &max_in_, &max_out_, &max_params_, this->scaling); + } + // Keep track of network score over multiple batches. 
+ loss += iter_loss; + if (this->detection) continue; + + int idx = 0; + for (int j = 0; j < result.size(); ++j) { + const float* result_vec = result[j]->cpu_data(); + for (int k = 0; k < result[j]->count(); ++k, ++idx) { + const float score = result_vec[k]; + if (i == 0) { + test_score.push_back(score); + test_score_output_id.push_back(j); + } else { + test_score[idx] += score; + } + } + } + LOG(INFO) << "Iteration: " << i; + } + loss /= iterations; + LOG(INFO) << "Loss: " << loss; + if (this->detection) return; + + for (int i = 0; i < test_score.size(); ++i) { + const float loss_weight = caffe_net->blob_loss_weights()[ + caffe_net->output_blob_indices()[test_score_output_id[i]]]; + std::ostringstream loss_msg_stream; + const float mean_score = test_score[i] / iterations; + if (loss_weight) { + loss_msg_stream << " (* " << loss_weight + << " = " << loss_weight * mean_score << " loss)"; + } + } + *accuracy = test_score[score_number] / iterations; +} + +void Quantization::Quantize2DynamicFixedPoint() { + // Find the integer length for dynamic fixed point numbers. + // The integer length is chosen such that no saturation occurs. + // This approximation assumes an infinitely long factional part. + // For layer activations, we reduce the integer length by one bit. 
+ vector lens; + vector scales; + for (int i = 0; i < layer_names_.size(); ++i) { + if (this->power) { + il_in_.push_back((int)ceil(log2(max_in_[i]))); + il_out_.push_back((int)ceil(log2(max_out_[i]))); + } else { + scale_in_.push_back(max_in_[i]); + scale_out_.push_back(max_out_[i]); + } + if (this->scaling == "single") { + if (this->power) + lens.push_back((int)ceil(log2(max_params_[i][0])+1)); + else + scales.push_back(max_params_[i][0]); + } else { + for (int j = 0; j < max_params_[i].size(); j++) { + if (this->power) + lens.push_back((int)ceil(log2(max_params_[i][j])+1)); + else + scales.push_back(max_params_[i][j]+0.0); + } + } + if (this->power) { + il_params_.push_back(lens); + lens.clear(); + } else { + scale_params_.push_back(scales); + scales.clear(); + } + } + // Debug + for (int k = 0; k < layer_names_.size(); ++k) { + if (this->scaling != "single") { + if (this->power) + LOG(INFO) << "Layer " << layer_names_[k] << ", parameters channel=" << il_params_[k].size(); + else + LOG(INFO) << "Layer " << layer_names_[k] << ", parameters channel=" << scale_params_[k].size(); + } + + if (this->power) { + LOG(INFO) << "Integer length input=" << il_in_[k]; + LOG(INFO) << "Integer length output=" << il_out_[k]; + } else { + LOG(INFO) << "Scale input=" << scale_in_[k]; + LOG(INFO) << "Scale output=" << scale_out_[k]; + } + + if (this->scaling == "single") { + if (this->power) + LOG(INFO) << "Integer length param=" << il_params_[k][0]; + else + LOG(INFO) << "Scale param=" << scale_params_[k][0]; + } else { + for (int j = 0; j < il_params_[k].size(); j++) { + if (this->power) + LOG(INFO) << "Integer length params[" << j << "]=" << il_params_[k][j]; + else + LOG(INFO) << "Scale params[" << j << "]=" << scale_params_[k][j]; + } + } + } + + // Choose bit-width for different network parts + bw_conv_params_ = 8; + bw_out_ = 8; + bw_in_ = bw_out_; + + NetParameter param; + // Score dynamic fixed point network. 
+ // This network combines dynamic fixed point parameters in convolutional and + // inner product layers, as well as dynamic fixed point activations. + caffe::ReadNetParamsFromTextFileOrDie(model_, ¶m); + EditNetDescriptionDynamicFixedPoint(¶m, "Convolution", + "Parameters_and_Activations", bw_conv_params_, bw_in_, + bw_out_); + WriteProtoToTextFile(param, model_quantized_); +} + +void Quantization::EditNetDescriptionDynamicFixedPoint(NetParameter* param, + const string layer_quantize, const string net_part, const int bw_conv, + const int bw_in, const int bw_out) { + int index = 0; + bool first_convolution = false; + for (int i = 0; i < param->layer_size(); ++i) { + // TODO: move first convolution check to transform script + if (layer_quantize.find("Convolution") != string::npos && + param->layer(i).type().find("Convolution") != string::npos) { + if (!first_convolution) { + first_convolution = true; + continue; + } + + // quantize parameters + if (net_part.find("Parameters") != string::npos) { + LayerParameter* param_layer = param->mutable_layer(i); + param_layer->set_type("Convolution"); + if (trimming_mode_ == "dynamic_fixed_point") { + param_layer->mutable_quantization_param()->set_bw_params(bw_conv); + if (this->power) { + vector vals = GetIntegerLengthParams(param->layer(i).name()); + for (int j = 0; j < vals.size(); j++) { + vals[j] = bw_conv - vals[j]; + param_layer->mutable_quantization_param()->add_fl_params(vals[j]); + } + } else { + vector vals = GetScaleParams(param->layer(i).name()); + for (int j = 0; j < vals.size(); j++) { + param_layer->mutable_quantization_param()->add_scale_params(vals[j]); + } + } + } + } + // quantize activations + if (net_part.find("Activations") != string::npos) { + LayerParameter* param_layer = param->mutable_layer(i); + param_layer->set_type("Convolution"); + if (trimming_mode_ == "dynamic_fixed_point") { + param_layer->mutable_quantization_param()->set_bw_layer_in(bw_in); + 
param_layer->mutable_quantization_param()->set_bw_layer_out(bw_out); + if (this->power) { + int val = GetIntegerLengthIn(param->layer(i).name()); + param_layer->mutable_quantization_param()->add_fl_layer_in(bw_in - val); + val = GetIntegerLengthOut(param->layer(i).name()); + param_layer->mutable_quantization_param()->add_fl_layer_out(bw_out - val); + } else { + float val = GetScaleIn(param->layer(i).name()); + param_layer->mutable_quantization_param()->add_scale_in(val); + val = GetScaleOut(param->layer(i).name()); + param_layer->mutable_quantization_param()->add_scale_out(val); + } + } + } + LayerParameter* param_layer = param->mutable_layer(i); + if (trimming_mode_ == "dynamic_fixed_point") { + param_layer->mutable_quantization_param()->set_precision(caffe::QuantizationParameter_Precision(0)); + } else { + LOG(FATAL) << "Unknown trimming mode: " << trimming_mode_; + } + index++; + } + } +} + +vector Quantization::GetIntegerLengthParams(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) + - layer_names_.begin(); + return il_params_[pos]; +} + +int Quantization::GetIntegerLengthIn(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) + - layer_names_.begin(); + return il_in_[pos]; +} + +int Quantization::GetIntegerLengthOut(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) + - layer_names_.begin(); + return il_out_[pos]; +} + +vector Quantization::GetScaleParams(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) + - layer_names_.begin(); + return scale_params_[pos]; +} + +float Quantization::GetScaleIn(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) + - layer_names_.begin(); + return scale_in_[pos]; +} + +float Quantization::GetScaleOut(const string layer_name) { + int pos = find(layer_names_.begin(), layer_names_.end(), layer_name) 
+ - layer_names_.begin(); + return scale_out_[pos]; +} diff --git a/tools/caffe.cpp b/tools/caffe.cpp index 8d78338d9..5edfaa88a 100644 --- a/tools/caffe.cpp +++ b/tools/caffe.cpp @@ -357,6 +357,9 @@ int test_detection(Net& caffe_net) { PERFORMANCE_INIT_MONITOR(); for (int i = 0; i < FLAGS_iterations; ++i) { +#ifdef DEBUG + LOG(INFO) << "Iteration: " << i; +#endif float iter_loss; const vector*>& result = caffe_net.Forward(&iter_loss); diff --git a/tools/sample.cpp b/tools/sample.cpp new file mode 100644 index 000000000..d860aff6d --- /dev/null +++ b/tools/sample.cpp @@ -0,0 +1,154 @@ +/* +All modification made by Intel Corporation: © 2016 Intel Corporation + +All contributions by the University of California: +Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +All rights reserved. + +All other contributions: +Copyright (c) 2014, 2015, the respective contributors +All rights reserved. +For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md + +A part of the code referenced BVLC CAFFE ristretto branch +For the original code go to https://github.com/pmgysel/caffe + +Redistribution and use in source and binary forms, with or without +modification, are permitted provided that the following conditions are met: + + * Redistributions of source code must retain the above copyright notice, + this list of conditions and the following disclaimer. + * Redistributions in binary form must reproduce the above copyright + notice, this list of conditions and the following disclaimer in the + documentation and/or other materials provided with the distribution. + * Neither the name of Intel Corporation nor the names of its contributors + may be used to endorse or promote products derived from this software + without specific prior written permission. 
+ +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. +*/ + +#include + +#include +#include +#include +#include + +#include "boost/algorithm/string.hpp" +#include "caffe/caffe.hpp" +#include "caffe/proto/caffe.pb.h" +#include "caffe/util/upgrade_proto.hpp" + +#include "caffe/quant/quantization.hpp" + +using caffe::Blob; +using caffe::Caffe; +using caffe::Net; +using caffe::Layer; +using caffe::Solver; +using caffe::shared_ptr; +using caffe::string; +using caffe::Timer; +using caffe::vector; +using std::ostringstream; + +DEFINE_string(model, "", + "The model definition protocol buffer text file.."); +DEFINE_string(weights, "", + "The trained weights."); +DEFINE_string(trimming_mode, "", + "Available options: dynamic_fixed_point."); +DEFINE_string(model_quantized, "", + "The output path of the quantized net"); +DEFINE_int32(iterations, 50, + "Optional: The number of iterations to run."); +DEFINE_double(error_margin, 2, + "Optional: the allowed accuracy drop in %"); +DEFINE_int32(score_number, 0, + "Optional: The score number to run."); +DEFINE_string(scaling, "single", + "The scaling model: single or multiple"); +DEFINE_int32(detection, 0, + "Optional: classfication or object detection"); +DEFINE_int32(power, 1, + "Optional: power of two or floating"); + +// A simple 
registry for caffe commands. + +// A simple registry for caffe commands. +typedef int (*BrewFunction)(); +typedef std::map BrewMap; +BrewMap g_brew_map; + +#define RegisterBrewFunction(func) \ +namespace { \ +class __Registerer_##func { \ + public: /* NOLINT */ \ + __Registerer_##func() { \ + g_brew_map[#func] = &func; \ + } \ +}; \ +__Registerer_##func g_registerer_##func; \ +} + +static BrewFunction GetBrewFunction(const caffe::string& name) { + if (g_brew_map.count(name)) { + return g_brew_map[name]; + } else { + LOG(ERROR) << "Available sampling actions:"; + for (BrewMap::iterator it = g_brew_map.begin(); + it != g_brew_map.end(); ++it) { + LOG(ERROR) << "\t" << it->first; + } + LOG(FATAL) << "Unknown action: " << name; + return NULL; // not reachable, just to suppress old compiler warnings. + } +} + +// To add a command, define a function "int command()" and register it with +// RegisterBrewFunction(action); + +// Quantize FP32 to INT8 +int quantize(){ + CHECK_GT(FLAGS_model.size(), 0) << "Need a model definition to score."; + CHECK_GT(FLAGS_weights.size(), 0) << "Need model weights to score."; + CHECK_GT(FLAGS_model_quantized.size(), 0) << "Need network description " + "output path."; + CHECK_GT(FLAGS_trimming_mode.size(), 0) << "Need trimming mode."; + Quantization* q = new Quantization(FLAGS_model, FLAGS_weights, + FLAGS_model_quantized, FLAGS_iterations, FLAGS_trimming_mode, + FLAGS_error_margin, FLAGS_score_number, FLAGS_scaling, FLAGS_detection, FLAGS_power); + q->QuantizeNet(); + delete q; + return 0; +} +RegisterBrewFunction(quantize); + +int main(int argc, char** argv) { + // Print output to stderr (while still logging). + FLAGS_alsologtostderr = 1; + // Set version + gflags::SetVersionString(AS_STRING(CAFFE_VERSION)); + // Usage message. + gflags::SetUsageMessage("command line brew\n" + "usage: sample \n\n" + "commands:\n" + " quantize Trim 32bit floating point net\n"); + // Run tool or show usage. 
+ caffe::GlobalInit(&argc, &argv); + if (argc == 2) { + return GetBrewFunction(caffe::string(argv[1]))(); + } else { + gflags::ShowUsageWithFlagsRestrict(argv[0], "tools/sample"); + } +} From 7f0083e4ab20c960fba80528dbe8fd932d6793e4 Mon Sep 17 00:00:00 2001 From: xiaolil1 Date: Wed, 3 Jan 2018 19:08:31 +0800 Subject: [PATCH 36/53] correct license in quantization code --- include/caffe/quant/base_quant_layer.hpp | 2 +- include/caffe/quant/quantization.hpp | 2 +- src/caffe/quant/layers/base_quant_layer.cpp | 2 +- src/caffe/quant/quantization.cpp | 2 +- tools/sample.cpp | 2 +- 5 files changed, 5 insertions(+), 5 deletions(-) diff --git a/include/caffe/quant/base_quant_layer.hpp b/include/caffe/quant/base_quant_layer.hpp index c048ca33b..e9deacdd1 100644 --- a/include/caffe/quant/base_quant_layer.hpp +++ b/include/caffe/quant/base_quant_layer.hpp @@ -1,5 +1,5 @@ /* -All modification made by Intel Corporation: © 2016 Intel Corporation +All modification made by Intel Corporation: © 2018 Intel Corporation All contributions by the University of California: Copyright (c) 2014, 2015, The Regents of the University of California (Regents) diff --git a/include/caffe/quant/quantization.hpp b/include/caffe/quant/quantization.hpp index 2fc856830..0f2420be1 100644 --- a/include/caffe/quant/quantization.hpp +++ b/include/caffe/quant/quantization.hpp @@ -1,5 +1,5 @@ /* -All modification made by Intel Corporation: © 2016 Intel Corporation +All modification made by Intel Corporation: © 2018 Intel Corporation All contributions by the University of California: Copyright (c) 2014, 2015, The Regents of the University of California (Regents) diff --git a/src/caffe/quant/layers/base_quant_layer.cpp b/src/caffe/quant/layers/base_quant_layer.cpp index 1055adc47..ea48d2296 100644 --- a/src/caffe/quant/layers/base_quant_layer.cpp +++ b/src/caffe/quant/layers/base_quant_layer.cpp @@ -1,5 +1,5 @@ /* -All modification made by Intel Corporation: © 2016 Intel Corporation +All modification made by 
Intel Corporation: © 2018 Intel Corporation All contributions by the University of California: Copyright (c) 2014, 2015, The Regents of the University of California (Regents) diff --git a/src/caffe/quant/quantization.cpp b/src/caffe/quant/quantization.cpp index ae312869b..2344d5e40 100644 --- a/src/caffe/quant/quantization.cpp +++ b/src/caffe/quant/quantization.cpp @@ -1,5 +1,5 @@ /* -All modification made by Intel Corporation: © 2016 Intel Corporation +All modification made by Intel Corporation: © 2018 Intel Corporation All contributions by the University of California: Copyright (c) 2014, 2015, The Regents of the University of California (Regents) diff --git a/tools/sample.cpp b/tools/sample.cpp index d860aff6d..3212cbe9b 100644 --- a/tools/sample.cpp +++ b/tools/sample.cpp @@ -1,5 +1,5 @@ /* -All modification made by Intel Corporation: © 2016 Intel Corporation +All modification made by Intel Corporation: © 2018 Intel Corporation All contributions by the University of California: Copyright (c) 2014, 2015, The Regents of the University of California (Regents) From 74117c0aaf9da5e086a8cc40d6e46e8c9f4d6bbf Mon Sep 17 00:00:00 2001 From: Shane Li Date: Thu, 4 Jan 2018 16:01:28 +0800 Subject: [PATCH 37/53] Add correct prototxt file of resnet_50 for benchmarking --- .../resnet_50/solver.prototxt | 16 +++++++++------- .../resnet_50/train_val_dummydata.prototxt | 12 ++++++++---- 2 files changed, 17 insertions(+), 11 deletions(-) diff --git a/models/intel_optimized_models/resnet_50/solver.prototxt b/models/intel_optimized_models/resnet_50/solver.prototxt index 2fe9feb99..bf9922187 100644 --- a/models/intel_optimized_models/resnet_50/solver.prototxt +++ b/models/intel_optimized_models/resnet_50/solver.prototxt @@ -1,17 +1,19 @@ net: "models/intel_optimized_models/resnet_50/train_val.prototxt" test_iter: 1000 -test_interval: 1248 +test_interval: 625 test_initialization: false display: 40 -base_lr: 0.4 +base_lr: 0.8 lr_policy: "multistep" -stepvalue:37440 -stepvalue:74880 
-stepvalue:99840 +stepvalue:18750 +stepvalue:37500 +stepvalue:50000 gamma: 0.1 -max_iter: 112600 +max_iter: 56300 +warmup_iter: 3125 # 1281167 / 2048 * 5 epochs +warmup_start_lr: 0.1 momentum: 0.9 weight_decay: 0.0001 -snapshot: 12480 +snapshot: 6250 snapshot_prefix: "models/intel_optimized_models/resnet_50/resnet_50_" solver_mode: CPU diff --git a/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt b/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt index ba298f468..15301d2b5 100644 --- a/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt +++ b/models/intel_optimized_models/resnet_50/train_val_dummydata.prototxt @@ -3,32 +3,36 @@ layer { name: "data" type: "DummyData" top: "data" + top: "label" include { phase: TRAIN } dummy_data_param { - shape: { dim: 32 dim: 3 dim: 224 dim: 224 } data_filler { type: "constant" value: 0.01 } + shape: { dim: 32 dim: 3 dim: 224 dim: 224 } + shape: { dim: 32 dim: 1 dim: 1 dim: 1 } } } layer { name: "data" type: "DummyData" + top: "data" top: "label" include { - phase: TRAIN + phase: TEST } dummy_data_param { - shape: { dim: 32 } data_filler { type: "constant" + value: 0.01 } + shape: { dim: 32 dim: 3 dim: 224 dim: 224 } + shape: { dim: 32 dim: 1 dim: 1 dim: 1 } } } - layer { bottom: "data" top: "conv1" From 3c5206c6fd31a344c0bdd8926c6f08a76edcf67e Mon Sep 17 00:00:00 2001 From: xiaolil1 Date: Thu, 4 Jan 2018 21:58:45 +0800 Subject: [PATCH 38/53] correct inceptionv3_int8 topology --- models/intel_optimized_models/int8/inceptionv3_int8.prototxt | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt index ed0cbf632..d9cfbc673 100644 --- a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt +++ b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt @@ -231,10 +231,10 @@ layer { quantization_param { precision: DYNAMIC_FIXED_POINT 
bw_layer_in: 8 - bw_layer_out: 32 #FIXME 8 + bw_layer_out: 8 bw_params: 8 fl_layer_in: 6 - fl_layer_out: 16 #FIXME 6 + fl_layer_out: 6 fl_params: 8 } } From 89620ab9b2422ba07a812e253b20b782f905b58d Mon Sep 17 00:00:00 2001 From: Feng Tian Date: Fri, 5 Jan 2018 15:36:28 +0800 Subject: [PATCH 39/53] update mklml link to 01.org --- external/mkl/prepare_mkl.sh | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/external/mkl/prepare_mkl.sh b/external/mkl/prepare_mkl.sh index d05340e44..f69e79423 100755 --- a/external/mkl/prepare_mkl.sh +++ b/external/mkl/prepare_mkl.sh @@ -74,12 +74,11 @@ echo $VERSION_LINE # Return Version Line # MKL DST=`dirname $0` OMP=0 -VERSION_MATCH=20171007 -ARCHIVE_BASENAME=mklml_lnx_2018.0.1.20171007.tgz +VERSION_MATCH=20171227 +ARCHIVE_BASENAME=mklml_lnx_2018.0.1.20171227.tgz MKL_CONTENT_DIR=`echo $ARCHIVE_BASENAME | rev | cut -d "." -f 2- | rev` -GITHUB_RELEASE_TAG=1.0.6 -MKLURL="https://github.com/intel/caffe/releases/download/$GITHUB_RELEASE_TAG/$ARCHIVE_BASENAME" +MKLURL="https://github.com/01org/mkl-dnn/releases/download/v0.12/$ARCHIVE_BASENAME" # there are diffrent MKL lib to be used for GCC and for ICC reg='^[0-9]+$' VERSION_LINE=`GetVersionName $MKLROOT` From c12407e7a8f7ad8255477bc316c6ddb21da71f0c Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Sat, 6 Jan 2018 03:43:28 +0800 Subject: [PATCH 40/53] Add the calibration tool for int8 accuracy adjustment. 
--- include/caffe/net.hpp | 8 +- scripts/calibrator.py | 326 ++++++++++++++++++++++++++++++++++++++++++ src/caffe/net.cpp | 37 ++++- tools/caffe.cpp | 11 +- 4 files changed, 375 insertions(+), 7 deletions(-) create mode 100644 scripts/calibrator.py diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index f27f24473..e3c2e6130 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -66,7 +66,7 @@ class Net { explicit Net(const NetParameter& param, const Net* root_net = NULL); explicit Net(const string& param_file, Phase phase, const int level = 0, const vector* stages = NULL, - const Net* root_net = NULL, std::string engine = ""); + const Net* root_net = NULL, std::string engine = "", bool use_weights = false); virtual ~Net() {} /// @brief Initialize a network with a NetParameter. @@ -312,6 +312,12 @@ class Net { */ static void CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled); + + + /** + * @brief Check the input file has quantization parms or not. + */ + static bool CheckWeightsHasQuantization(const string& weights); /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. 
diff --git a/scripts/calibrator.py b/scripts/calibrator.py new file mode 100644 index 000000000..84cd910f7 --- /dev/null +++ b/scripts/calibrator.py @@ -0,0 +1,326 @@ +import os +import sys +import numpy +import copy +#os.environ['GLOG_minloglevel'] = '2' +caffe_root="../" +sys.path.insert(0, caffe_root + 'python') + +import caffe +from caffe.proto import caffe_pb2 +import google.protobuf.text_format as txtf +import argparse +import subprocess + +def check_existence(path): + try: + return os.path.exists(path) + except Exception as e: + raise("Failed to check {} existence due to {}".format(path, str(e))) + + +def setup_env(): + os.chdir(os.path.dirname(os.path.abspath(params.root))) + caffe.set_mode_cpu() + + +def read_prototxt(prototxt): + try: + if not check_existence(prototxt): + return None; + + net = caffe_pb2.NetParameter() + + with open(prototxt) as f: + txtf.Merge(f.read(), net) + + return net + + except Exception as e: + raise("Failed to read {} due to {}".format(prototxt, str(e))) + + +def get_bottom_layers(layerName, net, start): + bottomLayers = [] + for index, value in enumerate(net.layer[start:]): + for sub_index, sub_value in enumerate(value.bottom): + if(sub_value == layerName): + bottomLayers.append((index, value.name, value.type)) + + return bottomLayers + + +def get_top_layers(l, net, end): + topLayers = [] + for layerIndex in range(0, end): + reverseLayerIndex = end - layerIndex - 1 + for blobIndex in range(0, len(net.layer[reverseLayerIndex].top)): + if (net.layer[reverseLayerIndex].top[blobIndex] in l.bottom): + topLayers.append((reverseLayerIndex, net.layer[reverseLayerIndex].name, net.layer[reverseLayerIndex].type)) + return topLayers + + +def GetAllTopLayers(l, net, end, skipLayers, interestingLayers): + allTopLayers = [] + topLayers = get_top_layers(l, net, end) + while True: + if len(topLayers) == 0: + break + + processedLayers = topLayers # sync topLayers change + for (li, ln, lt) in processedLayers: + if lt in skipLayers: + 
topLayers.remove((li, ln, lt)) + continue + if lt in interestingLayers: + lp = (li, ln, lt) + topLayers.remove(lp) + if lp not in allTopLayers: + allTopLayers.append(lp) + continue + + newTopLayers = get_top_layers(net.layer[li], net, li) + topLayers.remove((li, ln, lt)) + topLayers.extend(newTopLayers) + + return allTopLayers + +def GetAllBottomLayers(layerName, net, start, skipLayers, interestingLayers): + allBottomLayers = [] + bottomLayers = get_bottom_layers(layerName, net, start) + while True: + if len(bottomLayers) == 0: + break + + processedLayers = bottomLayers # sync bottomLayers change + for (li, ln, lt) in processedLayers: + if lt in skipLayers: + bottomLayers.remove((li, ln, lt)) + continue + if lt in interestingLayers: + lp = (li, ln, lt) + bottomLayers.remove(lp) + if lp not in allBottomLayers: + allBottomLayers.append(lp) + continue + + newBottomLayers = get_bottom_layers(ln, net, li + 1) + bottomLayers.remove((li, ln, lt)) + bottomLayers.extend(newBottomLayers) + + return allBottomLayers + + +def transform_convolutions(model_path): + net = caffe_pb2.NetParameter() + with open(model_path) as f: + s = f.read() + txtf.Merge(s, net) + + newNet = copy.deepcopy(net) + + convolutionLayers = [(value, index) for index, value in enumerate(net.layer) if value.type == 'Convolution'] + + interestingLayers = ['ReLU'] + skipLayers = ['Convolution', 'Eltwise', 'Concat'] + + u8_max = 255 + s8_max = 127 + + for (l, index) in convolutionLayers: + outputWithRelu = GetAllBottomLayers(l.name, net, index + 1, skipLayers, interestingLayers) + inputWithRelu = GetAllTopLayers(l, net, index, skipLayers, interestingLayers) + # print "Processing", l.type, l.name + + output_type = 'u8' if outputWithRelu else 's8' + input_type = 'u8' if inputWithRelu else 's8' + + for si in range(0, len(newNet.layer[index].quantization_param.scale_out)): + if len(outputWithRelu) > 0: #u8 + newNet.layer[index].quantization_param.scale_out[si] = round(u8_max / 
newNet.layer[index].quantization_param.scale_out[si], 2) + else: #s8 + newNet.layer[index].quantization_param.scale_out[si] = round(s8_max / newNet.layer[index].quantization_param.scale_out[si], 2) + + for si in range(0, len(newNet.layer[index].quantization_param.scale_in)): + if len(inputWithRelu) > 0: #u8 + newNet.layer[index].quantization_param.scale_in[si] = round(u8_max / newNet.layer[index].quantization_param.scale_in[si], 2) + else: #s8 + newNet.layer[index].quantization_param.scale_in[si] = round(s8_max / newNet.layer[index].quantization_param.scale_in[si], 2) + + for si in range(0, len(newNet.layer[index].quantization_param.scale_params)): + newNet.layer[index].quantization_param.scale_params[si] = round(s8_max / newNet.layer[index].quantization_param.scale_params[si], 2) + + with open(model_path, 'w') as f: + f.write(str(newNet)) + + +def generate_sample(sample_path, input_model, weights, + quantized_model, model_type, iterations=1, error_margin=1, power=0): + cmd = '{0} quantize -model {1} -weights {2} -model_quantized {3} -iterations {4} ' \ + '-trimming_mode dynamic_fixed_point -error_margin {5} -power {6}'.format(sample_path, input_model, weights, + quantized_model, iterations, + error_margin, power) + if model_type == 3: + cmd += ' --detection=1' + + os.system(cmd) + + +def get_the_accuracy(caffe_bin, model_def, model_weights, iterations, model_type): + output_log_name = 'calibrator_log.txt' + cmd = '{} test -model {} -weights {} -iterations {}'.format(caffe_bin, model_def, model_weights, iterations) + if model_type == 3: + cmd += ' -detection' + cmd += ' 2>&1|tee {}'.format(output_log_name) + os.system(cmd) + with open(output_log_name) as f: + data = f.readlines() + try: + if model_type == 1: + top_1 = data[-2].strip() + return float(top_1.split('=')[-1].strip()) + elif model_type == 2: + top_1 = data[-3].strip() + return float(top_1.split('=')[-1].strip()) + elif model_type == 3: + top_1 = data[-1].strip() + return 
float(top_1.split('=')[-1].strip()) + except Exception as e: + print 'Failed to generate accuracy due to {}'.format(str(e)) + sys.exit(-1) + + +def remove_top_quantized_parameter(current_quantized_file): + net = read_prototxt(current_quantized_file) + for i in net.layer: + if i.type == 'Convolution' and i.HasField('quantization_param'): + i.ClearField('quantization_param') + break + + with open(current_quantized_file, 'w') as f: + f.write(str(net)) + + +def update_caffemodel(quantized_prototxt, caffemodel_file, target_weights): + caffenet = caffe.Net(quantized_prototxt, + caffe.TEST) + caffenet.copy_from(caffemodel_file) + caffenet.save(target_weights) + + +def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, model_weights, iterations, enable_floating_point, toleration, model_type): + if enable_floating_point == 0: + print 'Updating quantization parameter...' + transform_convolutions(quantized_file) + current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_file, model_weights, iterations, model_type) + while abs(current_top1_accuracy - base_top1_accuracy) >= toleration: + print 'Tuning... 
' + print abs(current_top1_accuracy - base_top1_accuracy) + remove_top_quantized_parameter(quantized_file) + current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_prototxt, model_weights, iterations, model_type) + + +if __name__ == '__main__': + parser = argparse.ArgumentParser() + + parser.add_argument('-i', '--iterations', action='store', dest='iterations', default=10, + help='iterations') + + parser.add_argument('-f', '--floatingpoint', action='store', dest='floatingpoint', default=0, + help='floatingpoint') + + parser.add_argument('-w', '--weights', action='store', dest='weights', default='', + help='weights') + + parser.add_argument('-m', '--model', action='store', dest='model', default='', + help='model') + + parser.add_argument('-l', '--loss', action='store', dest='loss', default=0.01, + help='toleration') + + parser.add_argument('-t', '--type', action='store', dest='input_model_type', default='', + help='model type') + + parser.add_argument('-r', '--root', action='store', dest='root', default='', + help='caffe build path') + + parser.add_argument('-k', '--keep_model', action='store', dest='keep_model', default=0, + help='keep_model') + parser.add_argument('-v', '--version', action='version', version='%(prog)s 1.0') + + params = parser.parse_args() + + + try: + iterations = int(params.iterations) + except: + print 'Set the iterations to the default value 1000' + iterations = 1000 + + try: + enable_floating_point = 0 if int(params.floatingpoint) == 0 else 1 + except: + print 'Enable the floating point.' + enable_floating_point = 0 + try: + toleration = float(params.loss) + if toleration >= 1 or toleration < 0: + toleration = 0.01 + except: + print 'Set the toleration to 1%.' 
+ toleration = 0.01 + + try: + keep_model = int(params.keep_model) + except: + keep_model = 0 + + model = os.path.abspath(params.model) + weights = os.path.abspath(params.weights) + sample = os.path.abspath(params.root + 'tools/sample') + caffe_bin = os.path.abspath(params.root + 'tools/caffe') + setup_env() + + if params.input_model_type == 'resnet': + model_type = 1 + elif params.input_model_type == 'inceptionv3': + model_type = 2 + elif params.input_model_type == 'ssd': + model_type = 3 + else: + print 'Invalid model type!' + sys.exit(-1) + + + if check_existence(model) is False or check_existence(weights) is False or check_existence(sample) is False or check_existence(caffe_bin) is False: + print 'Please check model/weights/sample existence.' + sys.exit(-1) + + sys.path.insert(0, params.root + '../python') + quantized_prototxt = model.rsplit('.')[0] + '_quantized.prototxt' + quantized_weights = weights.rsplit('.')[0] + '_quantized.caffemodel' + print 'Sampling...' + generate_sample(sample, model, weights, + quantized_prototxt, model_type, 10, 100*toleration, enable_floating_point) + + print 'Sampling done' + print 'Generating the FP32 accuracy...' 
+ top_1 = get_the_accuracy(caffe_bin, model, weights, iterations, model_type) + print 'FP32 accuracy is: {}'.format(top_1) + + tuning_quantized_topology(top_1, quantized_prototxt, caffe_bin, weights, iterations, + enable_floating_point, toleration, model_type) + + update_caffemodel(quantized_prototxt, weights, quantized_weights) + + if keep_model: + print 'Updated prototxt {} is generated.'.format(quantized_prototxt) + else: + try: + os.remove(quantized_prototxt) + except Exception as e: + print 'Failed to remove {0} due to {1}'.format(quantized_prototxt, str(e)) + + print 'Updated weights {} is generated.'.format(quantized_weights) + + diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 646b66b8d..762f3707f 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -117,10 +117,14 @@ Net::Net(const NetParameter& param, const Net* root_net) template Net::Net(const string& param_file, Phase phase, const int level, const vector* stages, - const Net* root_net, std::string engine) + const Net* root_net, std::string engine, bool use_weights) : root_net_(root_net) { NetParameter param; - ReadNetParamsFromTextFileOrDie(param_file, ¶m); + if(use_weights) { + ReadNetParamsFromBinaryFileOrDie(param_file, ¶m); + } else { + ReadNetParamsFromTextFileOrDie(param_file, ¶m); + } // Set phase, stages and level param.mutable_state()->set_phase(phase); if (stages != NULL) { @@ -201,9 +205,16 @@ void Net::Init(const NetParameter& in_param) { param = param_with_mn; } #endif - + bool has_quantization_flag = false; + for(int i=0; i(param)).mutable_layer(i); + if (layer_param->type().compare("Convolution") == 0 && layer_param->has_quantization_param()) { + has_quantization_flag = true; + break; + } + } // Printing processed model - if (Caffe::root_solver()) { + if (Caffe::root_solver() && !has_quantization_flag) { LOG(INFO) << "Initializing net from parameters: " << std::endl; LOG(INFO).flush(); fflush(0); @@ -953,6 +964,24 @@ void Net::CompilationRuleFour(const NetParameter& param, 
return; } + +template +bool Net::CheckWeightsHasQuantization(const string& weights) { + + NetParameter param; + ReadNetParamsFromBinaryFileOrDie(weights, ¶m); + + for(int i=0; i(param)).mutable_layer(i); + if (layer_param->type().compare("Convolution") == 0 && layer_param->has_quantization_param()) { + return true; + } + } + + return false; +} + template void Net::GetBlobConsumers( std::vector& consumer_blobs, diff --git a/tools/caffe.cpp b/tools/caffe.cpp index 5edfaa88a..c172f8107 100644 --- a/tools/caffe.cpp +++ b/tools/caffe.cpp @@ -466,8 +466,15 @@ int test() { Caffe::set_mode(Caffe::CPU); } // Instantiate the caffe net. - Net caffe_net(FLAGS_model, caffe::TEST, FLAGS_level, &stages, NULL, - FLAGS_engine); + + bool use_weights_as_model = Net::CheckWeightsHasQuantization(FLAGS_weights); + string param_file = FLAGS_model; + if (use_weights_as_model) { + param_file = FLAGS_weights; + } + + Net caffe_net(param_file, caffe::TEST, FLAGS_level, &stages, NULL, + FLAGS_engine, use_weights_as_model); caffe_net.CopyTrainedLayersFrom(FLAGS_weights); LOG(INFO) << "Running for " << FLAGS_iterations << " iterations."; From b448ca1c14affad1ad53916598da90cccd23f10f Mon Sep 17 00:00:00 2001 From: "Zou, Feng" Date: Sat, 6 Jan 2018 20:31:01 +0800 Subject: [PATCH 41/53] fix multinode issue by removing link of MPI lib. 
originally MPI API is mapped to mpi library incorrectly, which should be mapped to API in MLSL library --- Makefile | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Makefile b/Makefile index a710983d4..f0eb4c71f 100644 --- a/Makefile +++ b/Makefile @@ -74,9 +74,9 @@ endif RETURN_STRING=$(shell ./external/mlsl/prepare_mlsl.sh) MLSL_ROOT=$(firstword $(RETURN_STRING)) - MLSL_LDFLAGS:=-lmpi -l$(lastword $(RETURN_STRING)) -Wl,-rpath,$(MLSL_ROOT)/intel64/lib + MLSL_LDFLAGS:=-l$(lastword $(RETURN_STRING)) -Wl,-rpath,$(MLSL_ROOT)/intel64/lib COMMON_FLAGS += -DUSE_MLSL=1 - LIBRARIES += mlsl mpi + LIBRARIES += mlsl INCLUDE_DIRS += $(MLSL_ROOT)/intel64/include LIBRARY_DIRS += $(MLSL_ROOT)/intel64/lib COMMON_FLAGS += -DFOUNDED_MLSL_ROOT=$(MLSL_ROOT) From b04e60f2d85885f9921c89a995af2a29406b3917 Mon Sep 17 00:00:00 2001 From: xiaolil1 Date: Sat, 6 Jan 2018 06:55:22 +0800 Subject: [PATCH 42/53] modify code to delete debug information --- include/caffe/layers/mkldnn_layers.hpp | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/include/caffe/layers/mkldnn_layers.hpp b/include/caffe/layers/mkldnn_layers.hpp index b32fa0a03..659b8bcf8 100644 --- a/include/caffe/layers/mkldnn_layers.hpp +++ b/include/caffe/layers/mkldnn_layers.hpp @@ -62,10 +62,9 @@ namespace caffe { // ===== Log functions ============================================== template inline void info_mem_pd(shared_ptr mem_pd, string name) { - // format of mem_pda -//#ifdef DEBUG +#ifdef DEBUG LOG(INFO) << name; - + // format of mem_pd switch (mem_pd->desc().data.format) { case memory::format::nchw: LOG(INFO) << "format: nchw"; break; case memory::format::nhwc: LOG(INFO) << "format: nhwc"; break; @@ -82,7 +81,7 @@ inline void info_mem_pd(shared_ptr mem_pd, string name) case memory::data_type::s32: LOG(INFO) << "data_type: s32"; break; default: assert(!"Error data_type"); } -//#endif +#endif } From cf53da86440c20f85694722283453dff1e1bb31f Mon Sep 17 00:00:00 2001 From: "Zhang, 
Guoming" Date: Sun, 7 Jan 2018 19:38:46 +0800 Subject: [PATCH 43/53] Revert "Merge "Add the calibration tool for int8 accuracy adjustment."" This reverts commit a95b33556439c142ea0e7a1341f6db8aefdbbc8b, reversing changes made to 3c5206c6fd31a344c0bdd8926c6f08a76edcf67e. --- include/caffe/net.hpp | 8 +- scripts/calibrator.py | 326 ------------------------------------------ src/caffe/net.cpp | 37 +---- tools/caffe.cpp | 11 +- 4 files changed, 7 insertions(+), 375 deletions(-) delete mode 100644 scripts/calibrator.py diff --git a/include/caffe/net.hpp b/include/caffe/net.hpp index e3c2e6130..f27f24473 100644 --- a/include/caffe/net.hpp +++ b/include/caffe/net.hpp @@ -66,7 +66,7 @@ class Net { explicit Net(const NetParameter& param, const Net* root_net = NULL); explicit Net(const string& param_file, Phase phase, const int level = 0, const vector* stages = NULL, - const Net* root_net = NULL, std::string engine = "", bool use_weights = false); + const Net* root_net = NULL, std::string engine = ""); virtual ~Net() {} /// @brief Initialize a network with a NetParameter. @@ -312,12 +312,6 @@ class Net { */ static void CompilationRuleFour(const NetParameter& param, NetParameter* param_compiled); - - - /** - * @brief Check the input file has quantization parms or not. - */ - static bool CheckWeightsHasQuantization(const string& weights); /** * @brief If find "Conv--BN--Scale" in current network, merge BN and Scale layer into Convolution * layers, this optimization only works in caffe TEST phase now. 
diff --git a/scripts/calibrator.py b/scripts/calibrator.py deleted file mode 100644 index 84cd910f7..000000000 --- a/scripts/calibrator.py +++ /dev/null @@ -1,326 +0,0 @@ -import os -import sys -import numpy -import copy -#os.environ['GLOG_minloglevel'] = '2' -caffe_root="../" -sys.path.insert(0, caffe_root + 'python') - -import caffe -from caffe.proto import caffe_pb2 -import google.protobuf.text_format as txtf -import argparse -import subprocess - -def check_existence(path): - try: - return os.path.exists(path) - except Exception as e: - raise("Failed to check {} existence due to {}".format(path, str(e))) - - -def setup_env(): - os.chdir(os.path.dirname(os.path.abspath(params.root))) - caffe.set_mode_cpu() - - -def read_prototxt(prototxt): - try: - if not check_existence(prototxt): - return None; - - net = caffe_pb2.NetParameter() - - with open(prototxt) as f: - txtf.Merge(f.read(), net) - - return net - - except Exception as e: - raise("Failed to read {} due to {}".format(prototxt, str(e))) - - -def get_bottom_layers(layerName, net, start): - bottomLayers = [] - for index, value in enumerate(net.layer[start:]): - for sub_index, sub_value in enumerate(value.bottom): - if(sub_value == layerName): - bottomLayers.append((index, value.name, value.type)) - - return bottomLayers - - -def get_top_layers(l, net, end): - topLayers = [] - for layerIndex in range(0, end): - reverseLayerIndex = end - layerIndex - 1 - for blobIndex in range(0, len(net.layer[reverseLayerIndex].top)): - if (net.layer[reverseLayerIndex].top[blobIndex] in l.bottom): - topLayers.append((reverseLayerIndex, net.layer[reverseLayerIndex].name, net.layer[reverseLayerIndex].type)) - return topLayers - - -def GetAllTopLayers(l, net, end, skipLayers, interestingLayers): - allTopLayers = [] - topLayers = get_top_layers(l, net, end) - while True: - if len(topLayers) == 0: - break - - processedLayers = topLayers # sync topLayers change - for (li, ln, lt) in processedLayers: - if lt in skipLayers: - 
topLayers.remove((li, ln, lt)) - continue - if lt in interestingLayers: - lp = (li, ln, lt) - topLayers.remove(lp) - if lp not in allTopLayers: - allTopLayers.append(lp) - continue - - newTopLayers = get_top_layers(net.layer[li], net, li) - topLayers.remove((li, ln, lt)) - topLayers.extend(newTopLayers) - - return allTopLayers - -def GetAllBottomLayers(layerName, net, start, skipLayers, interestingLayers): - allBottomLayers = [] - bottomLayers = get_bottom_layers(layerName, net, start) - while True: - if len(bottomLayers) == 0: - break - - processedLayers = bottomLayers # sync bottomLayers change - for (li, ln, lt) in processedLayers: - if lt in skipLayers: - bottomLayers.remove((li, ln, lt)) - continue - if lt in interestingLayers: - lp = (li, ln, lt) - bottomLayers.remove(lp) - if lp not in allBottomLayers: - allBottomLayers.append(lp) - continue - - newBottomLayers = get_bottom_layers(ln, net, li + 1) - bottomLayers.remove((li, ln, lt)) - bottomLayers.extend(newBottomLayers) - - return allBottomLayers - - -def transform_convolutions(model_path): - net = caffe_pb2.NetParameter() - with open(model_path) as f: - s = f.read() - txtf.Merge(s, net) - - newNet = copy.deepcopy(net) - - convolutionLayers = [(value, index) for index, value in enumerate(net.layer) if value.type == 'Convolution'] - - interestingLayers = ['ReLU'] - skipLayers = ['Convolution', 'Eltwise', 'Concat'] - - u8_max = 255 - s8_max = 127 - - for (l, index) in convolutionLayers: - outputWithRelu = GetAllBottomLayers(l.name, net, index + 1, skipLayers, interestingLayers) - inputWithRelu = GetAllTopLayers(l, net, index, skipLayers, interestingLayers) - # print "Processing", l.type, l.name - - output_type = 'u8' if outputWithRelu else 's8' - input_type = 'u8' if inputWithRelu else 's8' - - for si in range(0, len(newNet.layer[index].quantization_param.scale_out)): - if len(outputWithRelu) > 0: #u8 - newNet.layer[index].quantization_param.scale_out[si] = round(u8_max / 
newNet.layer[index].quantization_param.scale_out[si], 2) - else: #s8 - newNet.layer[index].quantization_param.scale_out[si] = round(s8_max / newNet.layer[index].quantization_param.scale_out[si], 2) - - for si in range(0, len(newNet.layer[index].quantization_param.scale_in)): - if len(inputWithRelu) > 0: #u8 - newNet.layer[index].quantization_param.scale_in[si] = round(u8_max / newNet.layer[index].quantization_param.scale_in[si], 2) - else: #s8 - newNet.layer[index].quantization_param.scale_in[si] = round(s8_max / newNet.layer[index].quantization_param.scale_in[si], 2) - - for si in range(0, len(newNet.layer[index].quantization_param.scale_params)): - newNet.layer[index].quantization_param.scale_params[si] = round(s8_max / newNet.layer[index].quantization_param.scale_params[si], 2) - - with open(model_path, 'w') as f: - f.write(str(newNet)) - - -def generate_sample(sample_path, input_model, weights, - quantized_model, model_type, iterations=1, error_margin=1, power=0): - cmd = '{0} quantize -model {1} -weights {2} -model_quantized {3} -iterations {4} ' \ - '-trimming_mode dynamic_fixed_point -error_margin {5} -power {6}'.format(sample_path, input_model, weights, - quantized_model, iterations, - error_margin, power) - if model_type == 3: - cmd += ' --detection=1' - - os.system(cmd) - - -def get_the_accuracy(caffe_bin, model_def, model_weights, iterations, model_type): - output_log_name = 'calibrator_log.txt' - cmd = '{} test -model {} -weights {} -iterations {}'.format(caffe_bin, model_def, model_weights, iterations) - if model_type == 3: - cmd += ' -detection' - cmd += ' 2>&1|tee {}'.format(output_log_name) - os.system(cmd) - with open(output_log_name) as f: - data = f.readlines() - try: - if model_type == 1: - top_1 = data[-2].strip() - return float(top_1.split('=')[-1].strip()) - elif model_type == 2: - top_1 = data[-3].strip() - return float(top_1.split('=')[-1].strip()) - elif model_type == 3: - top_1 = data[-1].strip() - return 
float(top_1.split('=')[-1].strip()) - except Exception as e: - print 'Failed to generate accuracy due to {}'.format(str(e)) - sys.exit(-1) - - -def remove_top_quantized_parameter(current_quantized_file): - net = read_prototxt(current_quantized_file) - for i in net.layer: - if i.type == 'Convolution' and i.HasField('quantization_param'): - i.ClearField('quantization_param') - break - - with open(current_quantized_file, 'w') as f: - f.write(str(net)) - - -def update_caffemodel(quantized_prototxt, caffemodel_file, target_weights): - caffenet = caffe.Net(quantized_prototxt, - caffe.TEST) - caffenet.copy_from(caffemodel_file) - caffenet.save(target_weights) - - -def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, model_weights, iterations, enable_floating_point, toleration, model_type): - if enable_floating_point == 0: - print 'Updating quantization parameter...' - transform_convolutions(quantized_file) - current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_file, model_weights, iterations, model_type) - while abs(current_top1_accuracy - base_top1_accuracy) >= toleration: - print 'Tuning... 
' - print abs(current_top1_accuracy - base_top1_accuracy) - remove_top_quantized_parameter(quantized_file) - current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_prototxt, model_weights, iterations, model_type) - - -if __name__ == '__main__': - parser = argparse.ArgumentParser() - - parser.add_argument('-i', '--iterations', action='store', dest='iterations', default=10, - help='iterations') - - parser.add_argument('-f', '--floatingpoint', action='store', dest='floatingpoint', default=0, - help='floatingpoint') - - parser.add_argument('-w', '--weights', action='store', dest='weights', default='', - help='weights') - - parser.add_argument('-m', '--model', action='store', dest='model', default='', - help='model') - - parser.add_argument('-l', '--loss', action='store', dest='loss', default=0.01, - help='toleration') - - parser.add_argument('-t', '--type', action='store', dest='input_model_type', default='', - help='model type') - - parser.add_argument('-r', '--root', action='store', dest='root', default='', - help='caffe build path') - - parser.add_argument('-k', '--keep_model', action='store', dest='keep_model', default=0, - help='keep_model') - parser.add_argument('-v', '--version', action='version', version='%(prog)s 1.0') - - params = parser.parse_args() - - - try: - iterations = int(params.iterations) - except: - print 'Set the iterations to the default value 1000' - iterations = 1000 - - try: - enable_floating_point = 0 if int(params.floatingpoint) == 0 else 1 - except: - print 'Enable the floating point.' - enable_floating_point = 0 - try: - toleration = float(params.loss) - if toleration >= 1 or toleration < 0: - toleration = 0.01 - except: - print 'Set the toleration to 1%.' 
- toleration = 0.01 - - try: - keep_model = int(params.keep_model) - except: - keep_model = 0 - - model = os.path.abspath(params.model) - weights = os.path.abspath(params.weights) - sample = os.path.abspath(params.root + 'tools/sample') - caffe_bin = os.path.abspath(params.root + 'tools/caffe') - setup_env() - - if params.input_model_type == 'resnet': - model_type = 1 - elif params.input_model_type == 'inceptionv3': - model_type = 2 - elif params.input_model_type == 'ssd': - model_type = 3 - else: - print 'Invalid model type!' - sys.exit(-1) - - - if check_existence(model) is False or check_existence(weights) is False or check_existence(sample) is False or check_existence(caffe_bin) is False: - print 'Please check model/weights/sample existence.' - sys.exit(-1) - - sys.path.insert(0, params.root + '../python') - quantized_prototxt = model.rsplit('.')[0] + '_quantized.prototxt' - quantized_weights = weights.rsplit('.')[0] + '_quantized.caffemodel' - print 'Sampling...' - generate_sample(sample, model, weights, - quantized_prototxt, model_type, 10, 100*toleration, enable_floating_point) - - print 'Sampling done' - print 'Generating the FP32 accuracy...' 
- top_1 = get_the_accuracy(caffe_bin, model, weights, iterations, model_type) - print 'FP32 accuracy is: {}'.format(top_1) - - tuning_quantized_topology(top_1, quantized_prototxt, caffe_bin, weights, iterations, - enable_floating_point, toleration, model_type) - - update_caffemodel(quantized_prototxt, weights, quantized_weights) - - if keep_model: - print 'Updated prototxt {} is generated.'.format(quantized_prototxt) - else: - try: - os.remove(quantized_prototxt) - except Exception as e: - print 'Failed to remove {0} due to {1}'.format(quantized_prototxt, str(e)) - - print 'Updated weights {} is generated.'.format(quantized_weights) - - diff --git a/src/caffe/net.cpp b/src/caffe/net.cpp index 762f3707f..646b66b8d 100644 --- a/src/caffe/net.cpp +++ b/src/caffe/net.cpp @@ -117,14 +117,10 @@ Net::Net(const NetParameter& param, const Net* root_net) template Net::Net(const string& param_file, Phase phase, const int level, const vector* stages, - const Net* root_net, std::string engine, bool use_weights) + const Net* root_net, std::string engine) : root_net_(root_net) { NetParameter param; - if(use_weights) { - ReadNetParamsFromBinaryFileOrDie(param_file, ¶m); - } else { - ReadNetParamsFromTextFileOrDie(param_file, ¶m); - } + ReadNetParamsFromTextFileOrDie(param_file, ¶m); // Set phase, stages and level param.mutable_state()->set_phase(phase); if (stages != NULL) { @@ -205,16 +201,9 @@ void Net::Init(const NetParameter& in_param) { param = param_with_mn; } #endif - bool has_quantization_flag = false; - for(int i=0; i(param)).mutable_layer(i); - if (layer_param->type().compare("Convolution") == 0 && layer_param->has_quantization_param()) { - has_quantization_flag = true; - break; - } - } + // Printing processed model - if (Caffe::root_solver() && !has_quantization_flag) { + if (Caffe::root_solver()) { LOG(INFO) << "Initializing net from parameters: " << std::endl; LOG(INFO).flush(); fflush(0); @@ -964,24 +953,6 @@ void Net::CompilationRuleFour(const NetParameter& param, 
return; } - -template -bool Net::CheckWeightsHasQuantization(const string& weights) { - - NetParameter param; - ReadNetParamsFromBinaryFileOrDie(weights, ¶m); - - for(int i=0; i(param)).mutable_layer(i); - if (layer_param->type().compare("Convolution") == 0 && layer_param->has_quantization_param()) { - return true; - } - } - - return false; -} - template void Net::GetBlobConsumers( std::vector& consumer_blobs, diff --git a/tools/caffe.cpp b/tools/caffe.cpp index c172f8107..5edfaa88a 100644 --- a/tools/caffe.cpp +++ b/tools/caffe.cpp @@ -466,15 +466,8 @@ int test() { Caffe::set_mode(Caffe::CPU); } // Instantiate the caffe net. - - bool use_weights_as_model = Net::CheckWeightsHasQuantization(FLAGS_weights); - string param_file = FLAGS_model; - if (use_weights_as_model) { - param_file = FLAGS_weights; - } - - Net caffe_net(param_file, caffe::TEST, FLAGS_level, &stages, NULL, - FLAGS_engine, use_weights_as_model); + Net caffe_net(FLAGS_model, caffe::TEST, FLAGS_level, &stages, NULL, + FLAGS_engine); caffe_net.CopyTrainedLayersFrom(FLAGS_weights); LOG(INFO) << "Running for " << FLAGS_iterations << " iterations."; From 22270ae854b150e3c0be735a6caac8bce56b4808 Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Sun, 7 Jan 2018 22:46:20 +0800 Subject: [PATCH 44/53] Add int8 accuracy calibration script. --- scripts/calibrator.py | 344 ++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 344 insertions(+) create mode 100644 scripts/calibrator.py diff --git a/scripts/calibrator.py b/scripts/calibrator.py new file mode 100644 index 000000000..7dcb7c54a --- /dev/null +++ b/scripts/calibrator.py @@ -0,0 +1,344 @@ +#!/usr/bin/env python +# +# All modification made by Intel Corporation: Copyright (c) 2018 Intel Corporation +# +# All contributions by the University of California: +# Copyright (c) 2014, 2015, The Regents of the University of California (Regents) +# All rights reserved. 
+# +# All other contributions: +# Copyright (c) 2014, 2015, the respective contributors +# All rights reserved. +# For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md +# +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions are met: +# +# * Redistributions of source code must retain the above copyright notice, +# this list of conditions and the following disclaimer. +# * Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# * Neither the name of Intel Corporation nor the names of its contributors +# may be used to endorse or promote products derived from this software +# without specific prior written permission. +# +# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE +# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR +# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER +# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, +# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE +# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 
+# +import os +import sys +import copy +import argparse + +caffe_root = "../" +sys.path.insert(0, caffe_root + 'python') + +import caffe +from caffe.proto import caffe_pb2 +import google.protobuf.text_format as txtf + + +def check_existence(path): + try: + return os.path.exists(path) + except Exception as e: + raise ("Failed to check {} existence due to {}".format(path, str(e))) + + +def setup_env(): + os.chdir(os.path.dirname(os.path.abspath(params.root))) + caffe.set_mode_cpu() + + +def read_prototxt(prototxt): + try: + if not check_existence(prototxt): + return None + + net = caffe_pb2.NetParameter() + + with open(prototxt) as f: + txtf.Merge(f.read(), net) + + return net + + except Exception as e: + raise ("Failed to read {} due to {}".format(prototxt, str(e))) + + +def get_bottom_layers(layer_name, net, start): + bottom_layers = [] + for index, value in enumerate(net.layer[start:]): + for sub_index, sub_value in enumerate(value.bottom): + if sub_value == layer_name: + bottom_layers.append((index, value.name, value.type)) + + return bottom_layers + + +def get_top_layers(l, net, end): + top_layers = [] + for layerIndex in range(0, end): + reverse_layer_index = end - layerIndex - 1 + for blobIndex in range(0, len(net.layer[reverse_layer_index].top)): + if net.layer[reverse_layer_index].top[blobIndex] in l.bottom: + top_layers.append((reverse_layer_index, net.layer[reverse_layer_index].name, + net.layer[reverse_layer_index].type)) + return top_layers + + +def get_all_top_layers(l, net, end, skip_layers, interesting_layers): + all_top_layers = [] + top_layers = get_top_layers(l, net, end) + while True: + if len(top_layers) == 0: + break + + processed_layers = top_layers # sync topLayers change + for (li, ln, lt) in processed_layers: + if lt in skip_layers: + top_layers.remove((li, ln, lt)) + continue + if lt in interesting_layers: + lp = (li, ln, lt) + top_layers.remove(lp) + if lp not in all_top_layers: + all_top_layers.append(lp) + continue + + new_top_layers = 
get_top_layers(net.layer[li], net, li) + top_layers.remove((li, ln, lt)) + top_layers.extend(new_top_layers) + + return all_top_layers + + +def get_all_bottom_layers(layer_name, net, start, skip_layers, interesting_layers): + all_bottom_layers = [] + bottom_layers = get_bottom_layers(layer_name, net, start) + while True: + if len(bottom_layers) == 0: + break + + processed_layers = bottom_layers # sync bottom_layers change + for (li, ln, lt) in processed_layers: + if lt in skip_layers: + bottom_layers.remove((li, ln, lt)) + continue + if lt in interesting_layers: + lp = (li, ln, lt) + bottom_layers.remove(lp) + if lp not in all_bottom_layers: + all_bottom_layers.append(lp) + continue + + new_bottom_layers = get_bottom_layers(ln, net, li + 1) + bottom_layers.remove((li, ln, lt)) + bottom_layers.extend(new_bottom_layers) + + return all_bottom_layers + + +def transform_convolutions(model_path): + net = caffe_pb2.NetParameter() + with open(model_path) as f: + s = f.read() + txtf.Merge(s, net) + + new_net = copy.deepcopy(net) + + convolution_layers = [(value, index) for index, value in enumerate(net.layer) if value.type == 'Convolution'] + + interesting_layers = ['ReLU'] + skip_layers = ['Convolution', 'Eltwise', 'Concat'] + + u8_max = 255 + s8_max = 127 + + for (l, index) in convolution_layers: + outputwith_relu = get_all_bottom_layers(l.name, net, index + 1, skip_layers, interesting_layers) + inputwith_relu = get_all_top_layers(l, net, index, skip_layers, interesting_layers) + # print "Processing", l.type, l.name + + # output_type = 'u8' if outputwith_relu else 's8' + # input_type = 'u8' if inputwith_relu else 's8' + + for si in range(0, len(new_net.layer[index].quantization_param.scale_out)): + if len(outputwith_relu) > 0: # u8 + new_net.layer[index].quantization_param.scale_out[si] = round(u8_max / new_net.layer[index]. + quantization_param.scale_out[si], 2) + else: # s8 + new_net.layer[index].quantization_param.scale_out[si] = round(s8_max / new_net.layer[index]. 
+ quantization_param.scale_out[si], 2) + + for si in range(0, len(new_net.layer[index].quantization_param.scale_in)): + if len(inputwith_relu) > 0: # u8 + new_net.layer[index].quantization_param.scale_in[si] = round(u8_max / new_net.layer[index]. + quantization_param.scale_in[si], 2) + else: # s8 + new_net.layer[index].quantization_param.scale_in[si] = round(s8_max / new_net.layer[index]. + quantization_param.scale_in[si], 2) + + for si in range(0, len(new_net.layer[index].quantization_param.scale_params)): + new_net.layer[index].quantization_param.scale_params[si] = round(s8_max / new_net.layer[index]. + quantization_param.scale_params[si], 2) + + with open(model_path, 'w') as f: + f.write(str(new_net)) + + +def generate_sample(sample_path, input_model, weights, + quantized_model, model_type, iterations=1, error_margin=1, power=0): + cmd = '{0} quantize -model {1} -weights {2} -model_quantized {3} -iterations {4} ' \ + '-trimming_mode dynamic_fixed_point -error_margin {5} -power {6}'.format(sample_path, input_model, weights, + quantized_model, iterations, + error_margin, power) + if model_type == 3: + cmd += ' --detection=1' + + os.system(cmd) + + +def get_the_accuracy(caffe_bin, model_def, model_weights, iterations, model_type): + output_log_name = 'calibrator_log.txt' + cmd = '{} test -model {} -weights {} -iterations {}'.format(caffe_bin, model_def, model_weights, iterations) + if model_type == 3: + cmd += ' -detection' + cmd += ' 2>&1|tee {}'.format(output_log_name) + os.system(cmd) + with open(output_log_name) as f: + data = f.readlines() + try: + if model_type == 1: + top_1 = data[-2].strip() + return float(top_1.split('=')[-1].strip()) + elif model_type == 2: + top_1 = data[-3].strip() + return float(top_1.split('=')[-1].strip()) + elif model_type == 3: + top_1 = data[-1].strip() + return float(top_1.split('=')[-1].strip()) + except Exception as e: + print 'Failed to generate accuracy due to {}'.format(str(e)) + sys.exit(-1) + + +def 
remove_top_quantized_parameter(current_quantized_file):
+    net = read_prototxt(current_quantized_file)
+    for i in net.layer:
+        if i.type == 'Convolution' and i.HasField('quantization_param'):
+            i.ClearField('quantization_param')
+            break
+
+    with open(current_quantized_file, 'w') as f:
+        f.write(str(net))
+
+
+def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, model_weights, iterations,
+                              enable_floating_point, toleration, model_type):
+    if enable_floating_point == 0:
+        print 'Updating quantization parameter...'
+        transform_convolutions(quantized_file)
+    current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_file, model_weights, iterations, model_type)
+    while abs(current_top1_accuracy - base_top1_accuracy) >= toleration:
+        print 'Tuning... '
+        print abs(current_top1_accuracy - base_top1_accuracy)
+        remove_top_quantized_parameter(quantized_file)
+        current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_file, model_weights, iterations, model_type)
+
+
+if __name__ == '__main__':
+    usage_string = 'Usage: 1.Build the caffe\n ' \
+                   '2.cd /path/to/caffe/scripts\n ' \
+                   '3.python calibrator.py ' \
+                   ' -r /path/to/caffe/build ' \
+                   ' -w pre-trained-fp32 weights ' \
+                   ' -m typology ' \
+                   ' -i iterations ' \
+                   ' -t resnet|inceptionv3|ssd\n '
+
+    parser = argparse.ArgumentParser(add_help=False)
+    parser.add_argument('-h', '--help', action='help', help=usage_string)
+
+    parser.add_argument('-i', '--iterations', action='store', dest='iterations', default=10,
+                        help='iterations')
+
+    parser.add_argument('-w', '--weights', action='store', dest='weights', default='',
+                        help='pre-trained-fp32-weights')
+
+    parser.add_argument('-m', '--model', action='store', dest='model', default='',
+                        help='model')
+
+    parser.add_argument('-l', '--accuracy_loss', action='store', dest='loss', default=0.01,
+                        help='accuracy-loss')
+
+    parser.add_argument('-t', '--type', action='store', dest='input_model_type', default='',
+                        help='model type')
+
+    
parser.add_argument('-r', '--root', action='store', dest='root', default='', + help='caffe build path') + + params = parser.parse_args() + + try: + iterations = int(params.iterations) + except: + print 'Set the iterations to the default value 1000' + iterations = 1000 + + try: + toleration = float(params.loss) + if toleration >= 1 or toleration < 0: + toleration = 0.01 + except: + print 'Set the toleration to 1%.' + toleration = 0.01 + + model = os.path.abspath(params.model) + weights = os.path.abspath(params.weights) + sample = os.path.abspath(params.root + 'tools/sample') + caffe_bin = os.path.abspath(params.root + 'tools/caffe') + setup_env() + + if params.input_model_type == 'resnet': + model_type = 1 + elif params.input_model_type == 'inceptionv3': + model_type = 2 + elif params.input_model_type == 'ssd': + model_type = 3 + else: + print 'Invalid model type!' + sys.exit(-1) + + if check_existence(model) is False or check_existence(weights) is False or check_existence(sample) is False or \ + check_existence(caffe_bin) is False: + print 'Please check model/weights/sample existence.' + sys.exit(-1) + + sys.path.insert(0, params.root + '../python') + quantized_prototxt = model.rsplit('.')[0] + '_quantized.prototxt' + quantized_weights = weights.rsplit('.')[0] + '_quantized.caffemodel' + enable_floating_point = 0 + print 'Sampling...' + generate_sample(sample, model, weights, + quantized_prototxt, model_type, 10, 100 * toleration, enable_floating_point) + + print 'Sampling done' + print 'Generating the FP32 accuracy...' 
+ top_1 = get_the_accuracy(caffe_bin, model, weights, iterations, model_type) + print 'FP32 accuracy is: {}'.format(top_1) + + tuning_quantized_topology(top_1, quantized_prototxt, caffe_bin, weights, iterations, enable_floating_point, + toleration, model_type) + + print 'Updated prototxt {} is generated.'.format(quantized_prototxt) From 2edff64e35119d49fb22b6b1d81f8fae3858060f Mon Sep 17 00:00:00 2001 From: "Yu, Chong" Date: Mon, 8 Jan 2018 00:43:27 +0800 Subject: [PATCH 45/53] Update MKLDNN version to ae00102be506ed0fe2099c6557df2aa88ad57ec1. --- mkldnn.commit | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/mkldnn.commit b/mkldnn.commit index 49f70144e..4925f6349 100644 --- a/mkldnn.commit +++ b/mkldnn.commit @@ -1 +1 @@ -aab753280e83137ba955f8f19d72cb6aaba545ef \ No newline at end of file +ae00102be506ed0fe2099c6557df2aa88ad57ec1 \ No newline at end of file From f9ae217ba23965d46d15cc5506c6327068e332a6 Mon Sep 17 00:00:00 2001 From: xiaolil1 Date: Mon, 8 Jan 2018 16:57:19 +0800 Subject: [PATCH 46/53] change int8 model to new floating point model and add resnet-50 sparse model --- .../int8/inceptionv3_int8.prototxt | 1163 ++++--- .../int8/resnet50_int8.prototxt | 424 +-- .../int8/resnet50_sparse_int8.prototxt | 3099 +++++++++++++++++ .../int8/ssd_int8.prototxt | 720 ++-- 4 files changed, 4325 insertions(+), 1081 deletions(-) create mode 100644 models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt diff --git a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt index d9cfbc673..70a52b698 100644 --- a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt +++ b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt @@ -35,8 +35,8 @@ layer { bottom: "data" top: "conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 32 @@ -46,7 +46,7 @@ layer { stride: 2 weight_filler { type: "gaussian" - std: 
0.01 + std: 0.00999999977648 } } } @@ -70,8 +70,8 @@ layer { bottom: "conv_conv2d_relu" top: "conv_1_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 32 @@ -81,7 +81,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -89,9 +89,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 5 - fl_params: 6 + scale_in: 75.3399963379 + scale_out: 24.3700008392 + scale_params: 125.419998169 } } layer { @@ -114,8 +114,8 @@ layer { bottom: "conv_1_1_conv2d_relu" top: "conv_2_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -125,7 +125,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -133,9 +133,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 5 - fl_layer_out: 6 - fl_params: 7 + scale_in: 48.9399986267 + scale_out: 33.9199981689 + scale_params: 238.300003052 } } layer { @@ -170,8 +170,8 @@ layer { bottom: "pool" top: "conv_3_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 80 @@ -181,7 +181,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -189,9 +189,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 6 + scale_in: 68.1200027466 + scale_out: 37.0099983215 + scale_params: 115.459999084 } } layer { @@ -214,8 +214,8 @@ layer { bottom: "conv_3_3_conv2d_relu" top: "conv_4_4_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -225,7 +225,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -233,9 +233,9 @@ layer { bw_layer_in: 8 
bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 8 + scale_in: 74.3199996948 + scale_out: 61.7999992371 + scale_params: 490.480010986 } } layer { @@ -270,8 +270,8 @@ layer { bottom: "pool1" top: "mixed_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -281,7 +281,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -289,9 +289,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 124.080001831 + scale_out: 62.7400016785 + scale_params: 239.179992676 } } layer { @@ -314,8 +314,8 @@ layer { bottom: "pool1" top: "mixed_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 48 @@ -325,7 +325,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -333,9 +333,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 124.080001831 + scale_out: 79.2399978638 + scale_params: 303.589996338 } } layer { @@ -358,8 +358,8 @@ layer { bottom: "mixed_tower_conv_conv2d_relu" top: "mixed_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -369,7 +369,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -377,9 +377,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 159.11000061 + scale_out: 69.2699966431 + scale_params: 495.859985352 } } layer { @@ -402,8 +402,8 @@ layer { bottom: "pool1" top: "mixed_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -413,7 +413,7 @@ layer { 
stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -421,9 +421,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 124.080001831 + scale_out: 72.8399963379 + scale_params: 215.38999939 } } layer { @@ -446,8 +446,8 @@ layer { bottom: "mixed_tower_1_conv_conv2d_relu" top: "mixed_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -457,7 +457,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -465,9 +465,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 146.25 + scale_out: 85.2699966431 + scale_params: 322.309997559 } } layer { @@ -490,8 +490,8 @@ layer { bottom: "mixed_tower_1_conv_1_conv2d_relu" top: "mixed_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -501,7 +501,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -509,9 +509,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 8 + scale_in: 171.210006714 + scale_out: 57.8400001526 + scale_params: 303.209991455 } } layer { @@ -546,8 +546,8 @@ layer { bottom: "AVE_pool_mixed_pool" top: "mixed_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 32 @@ -557,7 +557,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -565,9 +565,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 164.720001221 + scale_out: 87.5400009155 + scale_params: 160.130004883 } } layer { @@ -602,8 +602,8 
@@ layer { bottom: "ch_concat_mixed_chconcat" top: "mixed_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -613,7 +613,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -621,9 +621,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 57.8400001526 + scale_out: 63.8800010681 + scale_params: 229.300003052 } } layer { @@ -646,8 +646,8 @@ layer { bottom: "ch_concat_mixed_chconcat" top: "mixed_1_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 48 @@ -657,7 +657,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -665,9 +665,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 57.8400001526 + scale_out: 48.7599983215 + scale_params: 171.490005493 } } layer { @@ -690,8 +690,8 @@ layer { bottom: "mixed_1_tower_conv_conv2d_relu" top: "mixed_1_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -701,7 +701,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -709,9 +709,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 9 + scale_in: 97.9100036621 + scale_out: 54.2099990845 + scale_params: 516.630004883 } } layer { @@ -734,8 +734,8 @@ layer { bottom: "ch_concat_mixed_chconcat" top: "mixed_1_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -745,7 +745,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -753,9 +753,9 @@ 
layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 57.8400001526 + scale_out: 77.5999984741 + scale_params: 194.460006714 } } layer { @@ -778,8 +778,8 @@ layer { bottom: "mixed_1_tower_1_conv_conv2d_relu" top: "mixed_1_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -789,7 +789,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -797,9 +797,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 155.809997559 + scale_out: 100.75 + scale_params: 243.229995728 } } layer { @@ -822,8 +822,8 @@ layer { bottom: "mixed_1_tower_1_conv_1_conv2d_relu" top: "mixed_1_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -833,7 +833,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -841,9 +841,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 6 + scale_in: 202.300003052 + scale_out: 52.8199996948 + scale_params: 90.2200012207 } } layer { @@ -878,8 +878,8 @@ layer { bottom: "AVE_pool_mixed_1_pool" top: "mixed_1_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -889,7 +889,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -897,9 +897,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 80.2900009155 + scale_out: 100.050003052 + scale_params: 146.809997559 } } layer { @@ -934,8 +934,8 @@ layer { bottom: "ch_concat_mixed_1_chconcat" top: "mixed_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 
+ lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -945,7 +945,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -953,9 +953,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 52.8199996948 + scale_out: 78.9400024414 + scale_params: 251.970001221 } } layer { @@ -978,8 +978,8 @@ layer { bottom: "ch_concat_mixed_1_chconcat" top: "mixed_2_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 48 @@ -989,7 +989,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -997,9 +997,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 52.8199996948 + scale_out: 50.7700004578 + scale_params: 211.789993286 } } layer { @@ -1022,8 +1022,8 @@ layer { bottom: "mixed_2_tower_conv_conv2d_relu" top: "mixed_2_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -1033,7 +1033,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1041,9 +1041,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 9 + scale_in: 101.940002441 + scale_out: 62.0 + scale_params: 537.25 } } layer { @@ -1066,8 +1066,8 @@ layer { bottom: "ch_concat_mixed_1_chconcat" top: "mixed_2_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -1077,7 +1077,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1085,9 +1085,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + 
scale_in: 52.8199996948 + scale_out: 80.1200027466 + scale_params: 225.440002441 } } layer { @@ -1110,8 +1110,8 @@ layer { bottom: "mixed_2_tower_1_conv_conv2d_relu" top: "mixed_2_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -1121,7 +1121,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1129,9 +1129,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 7 + scale_in: 160.86000061 + scale_out: 62.7799987793 + scale_params: 141.570007324 } } layer { @@ -1154,8 +1154,8 @@ layer { bottom: "mixed_2_tower_1_conv_1_conv2d_relu" top: "mixed_2_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -1165,7 +1165,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1173,9 +1173,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 126.050003052 + scale_out: 65.6800003052 + scale_params: 423.859985352 } } layer { @@ -1210,8 +1210,8 @@ layer { bottom: "AVE_pool_mixed_2_pool" top: "mixed_2_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -1221,7 +1221,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1229,9 +1229,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 85.0 + scale_out: 95.9300003052 + scale_params: 127.099998474 } } layer { @@ -1266,8 +1266,8 @@ layer { bottom: "ch_concat_mixed_2_chconcat" top: "mixed_3_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -1277,7 
+1277,7 @@ layer { stride: 2 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1285,9 +1285,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 62.0 + scale_out: 76.8199996948 + scale_params: 251.36000061 } } layer { @@ -1310,8 +1310,8 @@ layer { bottom: "ch_concat_mixed_2_chconcat" top: "mixed_3_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 64 @@ -1321,7 +1321,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1329,9 +1329,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 62.0 + scale_out: 96.2900009155 + scale_params: 278.760009766 } } layer { @@ -1354,8 +1354,8 @@ layer { bottom: "mixed_3_tower_conv_conv2d_relu" top: "mixed_3_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -1365,7 +1365,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1373,9 +1373,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 8 - fl_params: 8 + scale_in: 193.350006104 + scale_out: 132.729995728 + scale_params: 457.459991455 } } layer { @@ -1398,8 +1398,8 @@ layer { bottom: "mixed_3_tower_conv_1_conv2d_relu" top: "mixed_3_tower_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 96 @@ -1409,7 +1409,7 @@ layer { stride: 2 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1417,9 +1417,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 8 - fl_layer_out: 6 - fl_params: 8 + scale_in: 266.5 + scale_out: 58.7700004578 + scale_params: 270.910003662 } 
} layer { @@ -1465,8 +1465,8 @@ layer { bottom: "ch_concat_mixed_3_chconcat" top: "mixed_4_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -1476,7 +1476,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1484,9 +1484,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 58.7700004578 + scale_out: 75.8399963379 + scale_params: 153.630004883 } } layer { @@ -1509,8 +1509,8 @@ layer { bottom: "ch_concat_mixed_3_chconcat" top: "mixed_4_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1520,7 +1520,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1528,9 +1528,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 58.7700004578 + scale_out: 55.1300010681 + scale_params: 182.440002441 } } layer { @@ -1553,8 +1553,8 @@ layer { bottom: "mixed_4_tower_conv_conv2d_relu" top: "mixed_4_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1562,7 +1562,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -1574,9 +1574,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 110.699996948 + scale_out: 48.0499992371 + scale_params: 157.910003662 } } layer { @@ -1599,8 +1599,8 @@ layer { bottom: "mixed_4_tower_conv_1_conv2d_relu" top: "mixed_4_tower_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -1608,7 +1608,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 
0.00999999977648 } pad_h: 3 pad_w: 0 @@ -1620,9 +1620,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 96.4899978638 + scale_out: 62.3899993896 + scale_params: 241.160003662 } } layer { @@ -1645,8 +1645,8 @@ layer { bottom: "ch_concat_mixed_3_chconcat" top: "mixed_4_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1656,7 +1656,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1664,9 +1664,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 8 - fl_params: 8 + scale_in: 58.7700004578 + scale_out: 145.690002441 + scale_params: 284.149993896 } } layer { @@ -1689,8 +1689,8 @@ layer { bottom: "mixed_4_tower_1_conv_conv2d_relu" top: "mixed_4_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1698,7 +1698,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -1710,9 +1710,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 8 - fl_layer_out: 7 - fl_params: 8 + scale_in: 292.529998779 + scale_out: 125.720001221 + scale_params: 290.660003662 } } layer { @@ -1735,8 +1735,8 @@ layer { bottom: "mixed_4_tower_1_conv_1_conv2d_relu" top: "mixed_4_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1744,7 +1744,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -1756,9 +1756,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 252.419998169 + scale_out: 69.25 + scale_params: 173.460006714 } } layer { @@ -1781,8 +1781,8 @@ layer { bottom: 
"mixed_4_tower_1_conv_2_conv2d_relu" top: "mixed_4_tower_1_conv_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 128 @@ -1790,7 +1790,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -1802,9 +1802,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 139.050003052 + scale_out: 79.2600021362 + scale_params: 185.009994507 } } layer { @@ -1827,8 +1827,8 @@ layer { bottom: "mixed_4_tower_1_conv_3_conv2d_relu" top: "mixed_4_tower_1_conv_4_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -1836,7 +1836,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -1848,9 +1848,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 159.149993896 + scale_out: 76.5999984741 + scale_params: 206.669998169 } } layer { @@ -1885,8 +1885,8 @@ layer { bottom: "AVE_pool_mixed_4_pool" top: "mixed_4_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -1896,7 +1896,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -1904,9 +1904,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 6 + scale_in: 100.790000916 + scale_out: 93.4000015259 + scale_params: 116.709999084 } } layer { @@ -1941,8 +1941,8 @@ layer { bottom: "ch_concat_mixed_4_chconcat" top: "mixed_5_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -1952,7 +1952,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ 
-1960,9 +1960,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 62.3899993896 + scale_out: 69.3000030518 + scale_params: 192.5 } } layer { @@ -1985,8 +1985,8 @@ layer { bottom: "ch_concat_mixed_4_chconcat" top: "mixed_5_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -1996,7 +1996,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2004,9 +2004,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 62.3899993896 + scale_out: 54.7299995422 + scale_params: 252.080001831 } } layer { @@ -2029,8 +2029,8 @@ layer { bottom: "mixed_5_tower_conv_conv2d_relu" top: "mixed_5_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2038,7 +2038,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2050,9 +2050,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 109.88999939 + scale_out: 54.1800003052 + scale_params: 196.350006104 } } layer { @@ -2075,8 +2075,8 @@ layer { bottom: "mixed_5_tower_conv_1_conv2d_relu" top: "mixed_5_tower_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2084,7 +2084,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2096,9 +2096,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 108.779998779 + scale_out: 47.1699981689 + scale_params: 218.880004883 } } layer { @@ -2121,8 +2121,8 @@ layer { bottom: "ch_concat_mixed_4_chconcat" top: "mixed_5_tower_1_conv_conv2d" 
param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2132,7 +2132,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2140,9 +2140,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 62.3899993896 + scale_out: 107.379997253 + scale_params: 294.489990234 } } layer { @@ -2165,8 +2165,8 @@ layer { bottom: "mixed_5_tower_1_conv_conv2d_relu" top: "mixed_5_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2174,7 +2174,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2186,9 +2186,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 215.61000061 + scale_out: 72.3499984741 + scale_params: 186.509994507 } } layer { @@ -2211,8 +2211,8 @@ layer { bottom: "mixed_5_tower_1_conv_1_conv2d_relu" top: "mixed_5_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2220,7 +2220,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2232,9 +2232,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 7 + scale_in: 145.259994507 + scale_out: 62.2599983215 + scale_params: 243.020004272 } } layer { @@ -2257,8 +2257,8 @@ layer { bottom: "mixed_5_tower_1_conv_2_conv2d_relu" top: "mixed_5_tower_1_conv_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2266,7 +2266,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2278,9 +2278,9 @@ layer { bw_layer_in: 8 
bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 125.019996643 + scale_out: 82.0299987793 + scale_params: 320.420013428 } } layer { @@ -2303,8 +2303,8 @@ layer { bottom: "mixed_5_tower_1_conv_3_conv2d_relu" top: "mixed_5_tower_1_conv_4_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2312,7 +2312,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2324,9 +2324,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 164.699996948 + scale_out: 78.0699996948 + scale_params: 216.5 } } layer { @@ -2361,8 +2361,8 @@ layer { bottom: "AVE_pool_mixed_5_pool" top: "mixed_5_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2372,7 +2372,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2380,9 +2380,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 101.949996948 + scale_out: 64.6999969482 + scale_params: 149.190002441 } } layer { @@ -2417,8 +2417,8 @@ layer { bottom: "ch_concat_mixed_5_chconcat" top: "mixed_6_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2428,7 +2428,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2436,9 +2436,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 47.1699981689 + scale_out: 67.3399963379 + scale_params: 165.38999939 } } layer { @@ -2461,8 +2461,8 @@ layer { bottom: "ch_concat_mixed_5_chconcat" top: "mixed_6_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + 
decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2472,7 +2472,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2480,9 +2480,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 47.1699981689 + scale_out: 72.6299972534 + scale_params: 194.589996338 } } layer { @@ -2505,8 +2505,8 @@ layer { bottom: "mixed_6_tower_conv_conv2d_relu" top: "mixed_6_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2514,7 +2514,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2526,9 +2526,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 145.830001831 + scale_out: 71.2099990845 + scale_params: 200.419998169 } } layer { @@ -2551,8 +2551,8 @@ layer { bottom: "mixed_6_tower_conv_1_conv2d_relu" top: "mixed_6_tower_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2560,7 +2560,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2572,9 +2572,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 142.979995728 + scale_out: 71.7600021362 + scale_params: 248.820007324 } } layer { @@ -2597,8 +2597,8 @@ layer { bottom: "ch_concat_mixed_5_chconcat" top: "mixed_6_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2608,7 +2608,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2616,9 +2616,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 
8 + scale_in: 47.1699981689 + scale_out: 89.7200012207 + scale_params: 276.739990234 } } layer { @@ -2641,8 +2641,8 @@ layer { bottom: "mixed_6_tower_1_conv_conv2d_relu" top: "mixed_6_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2650,7 +2650,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2662,9 +2662,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 7 + scale_in: 180.13999939 + scale_out: 51.8300018311 + scale_params: 231.600006104 } } layer { @@ -2687,8 +2687,8 @@ layer { bottom: "mixed_6_tower_1_conv_1_conv2d_relu" top: "mixed_6_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2696,7 +2696,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2708,9 +2708,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 104.069999695 + scale_out: 58.4500007629 + scale_params: 192.809997559 } } layer { @@ -2733,8 +2733,8 @@ layer { bottom: "mixed_6_tower_1_conv_2_conv2d_relu" top: "mixed_6_tower_1_conv_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 160 @@ -2742,7 +2742,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -2754,9 +2754,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 6 - fl_params: 7 + scale_in: 117.370002747 + scale_out: 54.4000015259 + scale_params: 210.199996948 } } layer { @@ -2779,8 +2779,8 @@ layer { bottom: "mixed_6_tower_1_conv_3_conv2d_relu" top: "mixed_6_tower_1_conv_4_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param 
{ num_output: 192 @@ -2788,7 +2788,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -2800,9 +2800,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 109.230003357 + scale_out: 86.8899993896 + scale_params: 312.559997559 } } layer { @@ -2837,8 +2837,8 @@ layer { bottom: "AVE_pool_mixed_6_pool" top: "mixed_6_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2848,7 +2848,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2856,9 +2856,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 6 + scale_in: 72.2799987793 + scale_out: 104.019996643 + scale_params: 119.339996338 } } layer { @@ -2893,8 +2893,8 @@ layer { bottom: "ch_concat_mixed_6_chconcat" top: "mixed_7_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2904,7 +2904,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2912,9 +2912,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 67.3399963379 + scale_out: 67.4499969482 + scale_params: 252.38999939 } } layer { @@ -2937,8 +2937,8 @@ layer { bottom: "ch_concat_mixed_6_chconcat" top: "mixed_7_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2948,7 +2948,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -2956,9 +2956,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 67.3399963379 + scale_out: 64.8700027466 + 
scale_params: 369.850006104 } } layer { @@ -2981,8 +2981,8 @@ layer { bottom: "mixed_7_tower_conv_conv2d_relu" top: "mixed_7_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -2990,7 +2990,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -3002,9 +3002,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 8 + scale_in: 130.25 + scale_out: 52.3899993896 + scale_params: 260.700012207 } } layer { @@ -3027,8 +3027,8 @@ layer { bottom: "mixed_7_tower_conv_1_conv2d_relu" top: "mixed_7_tower_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3036,7 +3036,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -3048,9 +3048,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 105.180000305 + scale_out: 76.4199981689 + scale_params: 316.489990234 } } layer { @@ -3073,8 +3073,8 @@ layer { bottom: "ch_concat_mixed_6_chconcat" top: "mixed_7_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3084,7 +3084,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3092,9 +3092,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 67.3399963379 + scale_out: 80.0599975586 + scale_params: 264.869995117 } } layer { @@ -3117,8 +3117,8 @@ layer { bottom: "mixed_7_tower_1_conv_conv2d_relu" top: "mixed_7_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3126,7 +3126,7 @@ layer { stride: 1 weight_filler { 
type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -3138,9 +3138,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 160.740005493 + scale_out: 72.5599975586 + scale_params: 273.700012207 } } layer { @@ -3163,8 +3163,8 @@ layer { bottom: "mixed_7_tower_1_conv_1_conv2d_relu" top: "mixed_7_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3172,7 +3172,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -3184,9 +3184,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 145.690002441 + scale_out: 67.7699966431 + scale_params: 273.950012207 } } layer { @@ -3209,8 +3209,8 @@ layer { bottom: "mixed_7_tower_1_conv_2_conv2d_relu" top: "mixed_7_tower_1_conv_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3218,7 +3218,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -3230,9 +3230,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 136.080001831 + scale_out: 68.7900009155 + scale_params: 271.679992676 } } layer { @@ -3255,8 +3255,8 @@ layer { bottom: "mixed_7_tower_1_conv_3_conv2d_relu" top: "mixed_7_tower_1_conv_4_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3264,7 +3264,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -3276,9 +3276,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 138.130004883 + scale_out: 83.0400009155 + scale_params: 331.309997559 } } layer { @@ 
-3313,8 +3313,8 @@ layer { bottom: "AVE_pool_mixed_7_pool" top: "mixed_7_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3324,7 +3324,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3332,9 +3332,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 116.220001221 + scale_out: 93.6600036621 + scale_params: 129.759994507 } } layer { @@ -3369,8 +3369,8 @@ layer { bottom: "ch_concat_mixed_7_chconcat" top: "mixed_8_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3380,7 +3380,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3388,9 +3388,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 67.4499969482 + scale_out: 75.5800018311 + scale_params: 245.309997559 } } layer { @@ -3413,8 +3413,8 @@ layer { bottom: "mixed_8_tower_conv_conv2d_relu" top: "mixed_8_tower_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 320 @@ -3424,7 +3424,7 @@ layer { stride: 2 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3432,9 +3432,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 7 + scale_in: 151.75 + scale_out: 40.4199981689 + scale_params: 171.190002441 } } layer { @@ -3457,8 +3457,8 @@ layer { bottom: "ch_concat_mixed_7_chconcat" top: "mixed_8_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3468,7 +3468,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } 
quantization_param { @@ -3476,9 +3476,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 7 + scale_in: 67.4499969482 + scale_out: 73.7399978638 + scale_params: 135.559997559 } } layer { @@ -3501,8 +3501,8 @@ layer { bottom: "mixed_8_tower_1_conv_conv2d_relu" top: "mixed_8_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3510,7 +3510,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 3 @@ -3522,9 +3522,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 6 + scale_in: 148.070007324 + scale_out: 57.2099990845 + scale_params: 123.540000916 } } layer { @@ -3547,8 +3547,8 @@ layer { bottom: "mixed_8_tower_1_conv_1_conv2d_relu" top: "mixed_8_tower_1_conv_2_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3556,7 +3556,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 3 pad_w: 0 @@ -3568,9 +3568,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 114.86000061 + scale_out: 96.2099990845 + scale_params: 310.769989014 } } layer { @@ -3593,8 +3593,8 @@ layer { bottom: "mixed_8_tower_1_conv_2_conv2d_relu" top: "mixed_8_tower_1_conv_3_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -3604,7 +3604,7 @@ layer { stride: 2 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3612,9 +3612,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 193.179992676 + scale_out: 67.4700012207 + scale_params: 313.369995117 } } layer { @@ -3660,8 +3660,8 @@ layer { bottom: 
"ch_concat_mixed_8_chconcat" top: "mixed_9_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 320 @@ -3670,7 +3670,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } kernel_h: 1 kernel_w: 1 @@ -3680,9 +3680,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 8 - fl_params: 8 + scale_in: 40.4199981689 + scale_out: 156.029998779 + scale_params: 400.739990234 } } layer { @@ -3705,8 +3705,8 @@ layer { bottom: "ch_concat_mixed_8_chconcat" top: "mixed_9_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3716,7 +3716,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3724,9 +3724,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 40.4199981689 + scale_out: 87.5299987793 + scale_params: 289.25 } } layer { @@ -3749,8 +3749,8 @@ layer { bottom: "mixed_9_tower_conv_conv2d_relu" top: "mixed_9_tower_mixed_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3758,7 +3758,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 1 @@ -3770,9 +3770,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 175.759994507 + scale_out: 103.349998474 + scale_params: 346.429992676 } } layer { @@ -3795,8 +3795,8 @@ layer { bottom: "mixed_9_tower_conv_conv2d_relu" top: "mixed_9_tower_mixed_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3804,7 +3804,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 1 pad_w: 0 @@ -3816,9 
+3816,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 7 - fl_params: 8 + scale_in: 175.759994507 + scale_out: 93.3399963379 + scale_params: 263.369995117 } } layer { @@ -3841,8 +3841,8 @@ layer { bottom: "ch_concat_mixed_8_chconcat" top: "mixed_9_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 448 @@ -3852,7 +3852,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3860,9 +3860,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 7 + scale_in: 40.4199981689 + scale_out: 70.1999969482 + scale_params: 241.759994507 } } layer { @@ -3885,8 +3885,8 @@ layer { bottom: "mixed_9_tower_1_conv_conv2d_relu" top: "mixed_9_tower_1_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3896,7 +3896,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -3904,9 +3904,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 9 + scale_in: 140.960006714 + scale_out: 63.2599983215 + scale_params: 514.510009766 } } layer { @@ -3929,8 +3929,8 @@ layer { bottom: "mixed_9_tower_1_conv_1_conv2d_relu" top: "mixed_9_tower_1_mixed_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3938,7 +3938,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 1 @@ -3950,9 +3950,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 9 + scale_in: 127.019996643 + scale_out: 98.9100036621 + scale_params: 570.369995117 } } layer { @@ -3975,8 +3975,8 @@ layer { bottom: "mixed_9_tower_1_conv_1_conv2d_relu" top: 
"mixed_9_tower_1_mixed_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -3984,7 +3984,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 1 pad_w: 0 @@ -3996,9 +3996,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 127.019996643 + scale_out: 99.2799987793 + scale_params: 365.929992676 } } layer { @@ -4033,8 +4033,8 @@ layer { bottom: "AVE_pool_mixed_9_pool" top: "mixed_9_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -4044,7 +4044,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -4052,9 +4052,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 8 - fl_params: 6 + scale_in: 75.75 + scale_out: 153.800003052 + scale_params: 119.88999939 } } layer { @@ -4091,8 +4091,8 @@ layer { bottom: "ch_concat_mixed_9_chconcat" top: "mixed_10_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 320 @@ -4101,7 +4101,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } kernel_h: 1 kernel_w: 1 @@ -4111,9 +4111,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 5 - fl_params: 4 + scale_in: 93.3399963379 + scale_out: 16.8299999237 + scale_params: 19.4200000763 } } layer { @@ -4136,8 +4136,8 @@ layer { bottom: "ch_concat_mixed_9_chconcat" top: "mixed_10_tower_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4147,7 +4147,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -4155,9 +4155,9 @@ layer { bw_layer_in: 8 
bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 6 + scale_in: 93.3399963379 + scale_out: 61.1500015259 + scale_params: 105.769996643 } } layer { @@ -4180,8 +4180,8 @@ layer { bottom: "mixed_10_tower_conv_conv2d_relu" top: "mixed_10_tower_mixed_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4189,7 +4189,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 1 @@ -4201,9 +4201,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 4 - fl_params: 5 + scale_in: 122.779998779 + scale_out: 9.39999961853 + scale_params: 35.6800003052 } } layer { @@ -4226,8 +4226,8 @@ layer { bottom: "mixed_10_tower_conv_conv2d_relu" top: "mixed_10_tower_mixed_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4235,7 +4235,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 1 pad_w: 0 @@ -4247,9 +4247,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 4 - fl_params: 5 + scale_in: 122.779998779 + scale_out: 9.22000026703 + scale_params: 37.3199996948 } } layer { @@ -4272,8 +4272,8 @@ layer { bottom: "ch_concat_mixed_9_chconcat" top: "mixed_10_tower_1_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 448 @@ -4283,7 +4283,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -4291,9 +4291,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 6 - fl_params: 6 + scale_in: 93.3399963379 + scale_out: 60.1800003052 + scale_params: 92.4100036621 } } layer { @@ -4316,8 +4316,8 @@ layer { bottom: "mixed_10_tower_1_conv_conv2d_relu" top: "mixed_10_tower_1_conv_1_conv2d" param { - 
lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4327,7 +4327,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -4335,9 +4335,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 6 - fl_layer_out: 7 - fl_params: 8 + scale_in: 120.839996338 + scale_out: 94.8700027466 + scale_params: 345.420013428 } } layer { @@ -4360,8 +4360,8 @@ layer { bottom: "mixed_10_tower_1_conv_1_conv2d_relu" top: "mixed_10_tower_1_mixed_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4369,7 +4369,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 0 pad_w: 1 @@ -4381,9 +4381,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 4 - fl_params: 5 + scale_in: 190.479995728 + scale_out: 8.35000038147 + scale_params: 44.3199996948 } } layer { @@ -4406,8 +4406,8 @@ layer { bottom: "mixed_10_tower_1_conv_1_conv2d_relu" top: "mixed_10_tower_1_mixed_conv_1_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 384 @@ -4415,7 +4415,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } pad_h: 1 pad_w: 0 @@ -4427,9 +4427,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 4 - fl_params: 5 + scale_in: 190.479995728 + scale_out: 10.9600000381 + scale_params: 44.2700004578 } } layer { @@ -4464,8 +4464,8 @@ layer { bottom: "MAX_pool_mixed_10_pool" top: "mixed_10_tower_2_conv_conv2d" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } convolution_param { num_output: 192 @@ -4475,7 +4475,7 @@ layer { stride: 1 weight_filler { type: "gaussian" - std: 0.01 + std: 0.00999999977648 } } quantization_param { @@ -4483,9 +4483,9 @@ layer { bw_layer_in: 8 
bw_layer_out: 8 bw_params: 8 - fl_layer_in: 7 - fl_layer_out: 5 - fl_params: 6 + scale_in: 93.3399963379 + scale_out: 19.9799995422 + scale_params: 81.5699996948 } } layer { @@ -4534,6 +4534,7 @@ layer { bottom: "global_pool" top: "global_pool" dropout_param { + dropout_ratio: 0.800000011921 } } layer { @@ -4548,12 +4549,12 @@ layer { bottom: "flatten" top: "fc1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } inner_product_param { num_output: 1000 @@ -4562,7 +4563,37 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } } +layer { + name: "loss" + type: "SoftmaxWithLoss" + bottom: "fc1" + bottom: "label" + top: "loss" +} +layer { + name: "acc/top-1" + type: "Accuracy" + bottom: "fc1" + bottom: "label" + top: "acc/top-1" + include { + phase: TEST + } +} +layer { + name: "acc/top-5" + type: "Accuracy" + bottom: "fc1" + bottom: "label" + top: "acc/top-5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/int8/resnet50_int8.prototxt b/models/intel_optimized_models/int8/resnet50_int8.prototxt index 2490f0be2..c48020181 100644 --- a/models/intel_optimized_models/int8/resnet50_int8.prototxt +++ b/models/intel_optimized_models/int8/resnet50_int8.prototxt @@ -44,7 +44,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } } @@ -100,7 +100,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -108,9 +108,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 6 + scale_in: 8.38000011444 + scale_out: 5.73999977112 + scale_params: 75.9199981689 } } layer { @@ -146,7 +146,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -154,9 +154,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - 
fl_layer_out: 4 - fl_params: 7 + scale_in: 8.38000011444 + scale_out: 17.6599998474 + scale_params: 151.089996338 } } layer { @@ -200,7 +200,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -208,9 +208,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 8 + scale_in: 17.6599998474 + scale_out: 19.9799995422 + scale_params: 416.320007324 } } layer { @@ -254,7 +254,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -262,9 +262,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 6 + scale_in: 19.9799995422 + scale_out: 5.73999977112 + scale_params: 72.1699981689 } } layer { @@ -317,7 +317,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -325,9 +325,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 4 - fl_params: 7 + scale_in: 11.5200004578 + scale_out: 17.9099998474 + scale_params: 192.330001831 } } layer { @@ -371,7 +371,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -379,9 +379,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 7 + scale_in: 17.9099998474 + scale_out: 19.5799999237 + scale_params: 210.529998779 } } layer { @@ -425,7 +425,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -433,9 +433,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 6 + scale_in: 19.5799999237 + scale_out: 5.73999977112 + scale_params: 88.4599990845 } } layer { @@ -488,7 +488,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -496,9 +496,9 @@ layer { bw_layer_in: 8 bw_layer_out: 
8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 4 - fl_params: 8 + scale_in: 11.5200004578 + scale_out: 18.6000003815 + scale_params: 360.359985352 } } layer { @@ -542,7 +542,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -550,9 +550,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 8 + scale_in: 18.6000003815 + scale_out: 13.5799999237 + scale_params: 308.029998779 } } layer { @@ -596,7 +596,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -604,9 +604,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 6 + scale_in: 13.5799999237 + scale_out: 5.73999977112 + scale_params: 103.910003662 } } layer { @@ -659,7 +659,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -667,9 +667,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 7 + scale_in: 11.5200004578 + scale_out: 4.78000020981 + scale_params: 135.169998169 } } layer { @@ -705,7 +705,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -713,9 +713,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 4 - fl_params: 8 + scale_in: 11.5200004578 + scale_out: 19.0499992371 + scale_params: 277.709991455 } } layer { @@ -759,7 +759,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -767,9 +767,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 8 + scale_in: 19.0499992371 + scale_out: 25.5400009155 + scale_params: 320.339996338 } } layer { @@ -813,7 +813,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -821,9 +821,9 @@ 
layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 6 + scale_in: 25.5400009155 + scale_out: 4.78000020981 + scale_params: 65.7200012207 } } layer { @@ -876,7 +876,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -884,9 +884,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 4 - fl_params: 8 + scale_in: 9.59000015259 + scale_out: 24.1900005341 + scale_params: 493.920013428 } } layer { @@ -930,7 +930,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -938,9 +938,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 8 + scale_in: 24.1900005341 + scale_out: 20.4899997711 + scale_params: 308.959991455 } } layer { @@ -984,7 +984,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -992,9 +992,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 5 + scale_in: 20.4899997711 + scale_out: 4.78000020981 + scale_params: 55.6899986267 } } layer { @@ -1047,7 +1047,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1055,9 +1055,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 7 + scale_in: 9.59000015259 + scale_out: 9.35999965668 + scale_params: 142.929992676 } } layer { @@ -1101,7 +1101,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1109,9 +1109,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 1 - fl_params: 6 + scale_in: 9.35999965668 + scale_out: 3.74000000954 + scale_params: 88.1699981689 } } layer { @@ -1155,7 +1155,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 
} } quantization_param { @@ -1163,9 +1163,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 1 - fl_layer_out: 3 - fl_params: 6 + scale_in: 3.74000000954 + scale_out: 4.78000020981 + scale_params: 66.2300033569 } } layer { @@ -1218,7 +1218,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1226,9 +1226,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 9.59000015259 + scale_out: 7.40999984741 + scale_params: 240.589996338 } } layer { @@ -1272,7 +1272,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1280,9 +1280,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 3 - fl_params: 8 + scale_in: 7.40999984741 + scale_out: 15.0600004196 + scale_params: 314.239990234 } } layer { @@ -1326,7 +1326,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1334,9 +1334,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 6 + scale_in: 15.0600004196 + scale_out: 4.78000020981 + scale_params: 113.980003357 } } layer { @@ -1389,7 +1389,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1397,9 +1397,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 9.59000015259 + scale_out: 3.70000004768 + scale_params: 213.380004883 } } layer { @@ -1435,7 +1435,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1443,9 +1443,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 8 + scale_in: 9.59000015259 + scale_out: 12.7700004578 + scale_params: 254.339996338 } } layer { @@ -1489,7 +1489,7 @@ layer { } 
bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1497,9 +1497,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 3 - fl_params: 8 + scale_in: 12.7700004578 + scale_out: 15.3699998856 + scale_params: 473.709991455 } } layer { @@ -1543,7 +1543,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1551,9 +1551,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 6 + scale_in: 15.3699998856 + scale_out: 3.70000004768 + scale_params: 75.6200027466 } } layer { @@ -1606,7 +1606,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1614,9 +1614,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 3 - fl_params: 8 + scale_in: 7.42999982834 + scale_out: 12.2600002289 + scale_params: 325.369995117 } } layer { @@ -1660,7 +1660,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1668,9 +1668,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 12.2600002289 + scale_out: 6.44000005722 + scale_params: 131.820007324 } } layer { @@ -1714,7 +1714,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1722,9 +1722,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 2 - fl_params: 6 + scale_in: 6.44000005722 + scale_out: 3.70000004768 + scale_params: 67.4400024414 } } layer { @@ -1777,7 +1777,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1785,9 +1785,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 3 - fl_params: 8 + scale_in: 7.42999982834 + scale_out: 11.529999733 + scale_params: 
369.480010986 } } layer { @@ -1831,7 +1831,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1839,9 +1839,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 11.529999733 + scale_out: 6.94999980927 + scale_params: 139.050003052 } } layer { @@ -1885,7 +1885,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1893,9 +1893,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 2 - fl_params: 6 + scale_in: 6.94999980927 + scale_out: 3.70000004768 + scale_params: 76.9700012207 } } layer { @@ -1948,7 +1948,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -1956,9 +1956,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 3 - fl_params: 8 + scale_in: 7.42999982834 + scale_out: 10.7299995422 + scale_params: 312.220001221 } } layer { @@ -2002,7 +2002,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2010,9 +2010,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 10.7299995422 + scale_out: 5.40000009537 + scale_params: 201.61000061 } } layer { @@ -2056,7 +2056,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2064,9 +2064,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 2 - fl_params: 6 + scale_in: 5.40000009537 + scale_out: 3.70000004768 + scale_params: 77.1500015259 } } layer { @@ -2119,7 +2119,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2127,9 +2127,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 3 - fl_params: 8 + scale_in: 
7.42999982834 + scale_out: 11.7600002289 + scale_params: 293.720001221 } } layer { @@ -2173,7 +2173,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2181,9 +2181,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 2 - fl_params: 7 + scale_in: 11.7600002289 + scale_out: 6.51999998093 + scale_params: 185.36000061 } } layer { @@ -2227,7 +2227,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2235,9 +2235,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 2 - fl_params: 6 + scale_in: 6.51999998093 + scale_out: 3.70000004768 + scale_params: 98.8199996948 } } layer { @@ -2290,7 +2290,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2298,9 +2298,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 4 - fl_params: 8 + scale_in: 7.42999982834 + scale_out: 16.2900009155 + scale_params: 300.049987793 } } layer { @@ -2344,7 +2344,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2352,9 +2352,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 2 - fl_params: 7 + scale_in: 16.2900009155 + scale_out: 5.01999998093 + scale_params: 240.550003052 } } layer { @@ -2398,7 +2398,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2406,9 +2406,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 2 - fl_params: 6 + scale_in: 5.01999998093 + scale_out: 3.70000004768 + scale_params: 93.3000030518 } } layer { @@ -2461,7 +2461,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2469,9 +2469,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - 
fl_layer_in: 2 - fl_layer_out: 0 - fl_params: 5 + scale_in: 7.42999982834 + scale_out: 0.939999997616 + scale_params: 45.0 } } layer { @@ -2507,7 +2507,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2515,9 +2515,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 4 - fl_params: 8 + scale_in: 7.42999982834 + scale_out: 21.5699996948 + scale_params: 375.869995117 } } layer { @@ -2561,7 +2561,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2569,9 +2569,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 7 + scale_in: 21.5699996948 + scale_out: 25.2000007629 + scale_params: 228.160003662 } } layer { @@ -2615,7 +2615,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2623,9 +2623,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 0 - fl_params: 4 + scale_in: 25.2000007629 + scale_out: 0.939999997616 + scale_params: 27.1299991608 } } layer { @@ -2678,7 +2678,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2686,9 +2686,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 0 - fl_layer_out: 4 - fl_params: 9 + scale_in: 1.87999999523 + scale_out: 25.4400005341 + scale_params: 999.760009766 } } layer { @@ -2732,7 +2732,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2740,9 +2740,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 7 + scale_in: 25.4400005341 + scale_out: 29.2800006866 + scale_params: 153.630004883 } } layer { @@ -2786,7 +2786,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2794,9 +2794,9 @@ 
layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 0 - fl_params: 5 + scale_in: 29.2800006866 + scale_out: 0.939999997616 + scale_params: 35.3400001526 } } layer { @@ -2849,7 +2849,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2857,9 +2857,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 0 - fl_layer_out: 4 - fl_params: 9 + scale_in: 1.87999999523 + scale_out: 21.8099994659 + scale_params: 1013.09997559 } } layer { @@ -2903,7 +2903,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2911,9 +2911,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 8 + scale_in: 21.8099994659 + scale_out: 14.7100000381 + scale_params: 321.25 } } layer { @@ -2957,7 +2957,7 @@ layer { } bias_filler { type: "constant" - value: 0.2 + value: 0.20000000298 } } quantization_param { @@ -2965,9 +2965,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 0 - fl_params: 4 + scale_in: 14.7100000381 + scale_out: 0.939999997616 + scale_params: 23.2399997711 } } layer { @@ -3027,7 +3027,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } } @@ -3038,7 +3038,7 @@ layer { bottom: "label" top: "accuracy-top1" include { - phase: TEST + phase: TEST } } layer { @@ -3048,7 +3048,7 @@ layer { bottom: "label" top: "accuracy-top5" include { - phase: TEST + phase: TEST } accuracy_param { top_k: 5 diff --git a/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt b/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt new file mode 100644 index 000000000..402b24a63 --- /dev/null +++ b/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt @@ -0,0 +1,3099 @@ +name: "ResNet-50" +layer { + name: "data" + type: "DummyData" + top: "data" + dummy_data_param { + data_filler { + type: "constant" + 
value: 0.01 + } + shape { + dim: 64 + dim: 3 + dim: 224 + dim: 224 + } + } +} +layer { + name: "data" + type: "DummyData" + top: "label" + dummy_data_param { + data_filler { + type: "constant" + } + shape { + dim: 64 + } + } +} +layer { + name: "conv1" + type: "Convolution" + bottom: "data" + top: "conv1" + convolution_param { + num_output: 64 + pad: 3 + kernel_size: 7 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } +} +layer { + name: "bn_conv1" + type: "BatchNorm" + bottom: "conv1" + top: "conv1" + batch_norm_param { + } +} +layer { + name: "scale_conv1" + type: "Scale" + bottom: "conv1" + top: "conv1" + scale_param { + bias_term: true + } +} +layer { + name: "conv1_relu" + type: "ReLU" + bottom: "conv1" + top: "conv1" + relu_param { + } +} +layer { + name: "pool1" + type: "Pooling" + bottom: "conv1" + top: "pool1" + pooling_param { + pool: MAX + kernel_size: 3 + stride: 2 + } +} +layer { + name: "res2a_branch1" + type: "Convolution" + bottom: "pool1" + top: "res2a_branch1" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.38000011444 + scale_out: 6.03000020981 + scale_params: 75.9199981689 + } +} +layer { + name: "bn2a_branch1" + type: "BatchNorm" + bottom: "res2a_branch1" + top: "res2a_branch1" + batch_norm_param { + } +} +layer { + name: "scale2a_branch1" + type: "Scale" + bottom: "res2a_branch1" + top: "res2a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2a" + type: "Convolution" + bottom: "pool1" + top: "res2a_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + 
value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.38000011444 + scale_out: 17.6599998474 + scale_params: 151.089996338 + } +} +layer { + name: "bn2a_branch2a" + type: "BatchNorm" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2a" + type: "Scale" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2a_relu" + type: "ReLU" + bottom: "res2a_branch2a" + top: "res2a_branch2a" + relu_param { + } +} +layer { + name: "res2a_branch2b" + type: "Convolution" + bottom: "res2a_branch2a" + top: "res2a_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 17.6599998474 + scale_out: 19.9799995422 + scale_params: 416.320007324 + } +} +layer { + name: "bn2a_branch2b" + type: "BatchNorm" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2b" + type: "Scale" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2a_branch2b_relu" + type: "ReLU" + bottom: "res2a_branch2b" + top: "res2a_branch2b" + relu_param { + } +} +layer { + name: "res2a_branch2c" + type: "Convolution" + bottom: "res2a_branch2b" + top: "res2a_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 19.9799995422 + scale_out: 
6.03000020981 + scale_params: 72.1699981689 + } +} +layer { + name: "bn2a_branch2c" + type: "BatchNorm" + bottom: "res2a_branch2c" + top: "res2a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale2a_branch2c" + type: "Scale" + bottom: "res2a_branch2c" + top: "res2a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2a" + type: "Eltwise" + bottom: "res2a_branch1" + bottom: "res2a_branch2c" + top: "res2a" + eltwise_param { + } +} +layer { + name: "res2a_relu" + type: "ReLU" + bottom: "res2a" + top: "res2a" + relu_param { + } +} +layer { + name: "res2b_branch2a" + type: "Convolution" + bottom: "res2a" + top: "res2b_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 12.1099996567 + scale_out: 17.9099998474 + scale_params: 192.330001831 + } +} +layer { + name: "bn2b_branch2a" + type: "BatchNorm" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2a" + type: "Scale" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2b_branch2a_relu" + type: "ReLU" + bottom: "res2b_branch2a" + top: "res2b_branch2a" + relu_param { + } +} +layer { + name: "res2b_branch2b" + type: "Convolution" + bottom: "res2b_branch2a" + top: "res2b_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 17.9099998474 + scale_out: 19.5799999237 + scale_params: 210.529998779 + } +} +layer { + name: "bn2b_branch2b" + 
type: "BatchNorm" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2b" + type: "Scale" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2b_branch2b_relu" + type: "ReLU" + bottom: "res2b_branch2b" + top: "res2b_branch2b" + relu_param { + } +} +layer { + name: "res2b_branch2c" + type: "Convolution" + bottom: "res2b_branch2b" + top: "res2b_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 19.5799999237 + scale_out: 6.03000020981 + scale_params: 88.4599990845 + } +} +layer { + name: "bn2b_branch2c" + type: "BatchNorm" + bottom: "res2b_branch2c" + top: "res2b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale2b_branch2c" + type: "Scale" + bottom: "res2b_branch2c" + top: "res2b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2b" + type: "Eltwise" + bottom: "res2a" + bottom: "res2b_branch2c" + top: "res2b" + eltwise_param { + } +} +layer { + name: "res2b_relu" + type: "ReLU" + bottom: "res2b" + top: "res2b" + relu_param { + } +} +layer { + name: "res2b_p" + type: "Pooling" + bottom: "res2b" + top: "res2b_p" + pooling_param { + pool: MAX + kernel_size: 1 + stride: 2 + } +} +layer { + name: "res2c_branch2a" + type: "Convolution" + bottom: "res2b" + top: "res2c_branch2a" + convolution_param { + num_output: 64 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 12.1099996567 + scale_out: 18.6000003815 + scale_params: 
360.359985352 + } +} +layer { + name: "bn2c_branch2a" + type: "BatchNorm" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale2c_branch2a" + type: "Scale" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res2c_branch2a_relu" + type: "ReLU" + bottom: "res2c_branch2a" + top: "res2c_branch2a" + relu_param { + } +} +layer { + name: "res2c_branch2b" + type: "Convolution" + bottom: "res2c_branch2a" + top: "res2c_branch2b" + convolution_param { + num_output: 64 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 18.6000003815 + scale_out: 16.9200000763 + scale_params: 308.029998779 + } +} +layer { + name: "bn2c_branch2b" + type: "BatchNorm" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale2c_branch2b" + type: "Scale" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res2c_branch2b_relu" + type: "ReLU" + bottom: "res2c_branch2b" + top: "res2c_branch2b" + relu_param { + } +} +layer { + name: "res2c_branch2c" + type: "Convolution" + bottom: "res2c_branch2b" + top: "res2c_branch2c" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 16.9200000763 + scale_out: 5.73999977112 + scale_params: 103.910003662 + } +} +layer { + name: "bn2c_branch2c" + type: "BatchNorm" + bottom: "res2c_branch2c" + top: "res2c_branch2c" + batch_norm_param { + } +} +layer { + name: 
"scale2c_branch2c" + type: "Scale" + bottom: "res2c_branch2c" + top: "res2c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res2c" + type: "Eltwise" + bottom: "res2b_p" + bottom: "res2c_branch2c" + top: "res2c" + eltwise_param { + } +} +layer { + name: "res2c_relu" + type: "ReLU" + bottom: "res2c" + top: "res2c" + relu_param { + } +} +layer { + name: "res3a_branch1" + type: "Convolution" + bottom: "res2c" + top: "res3a_branch1" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 11.5200004578 + scale_out: 4.65000009537 + scale_params: 135.169998169 + } +} +layer { + name: "bn3a_branch1" + type: "BatchNorm" + bottom: "res3a_branch1" + top: "res3a_branch1" + batch_norm_param { + } +} +layer { + name: "scale3a_branch1" + type: "Scale" + bottom: "res3a_branch1" + top: "res3a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2a" + type: "Convolution" + bottom: "res2c" + top: "res3a_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 11.5200004578 + scale_out: 19.0499992371 + scale_params: 277.709991455 + } +} +layer { + name: "bn3a_branch2a" + type: "BatchNorm" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2a" + type: "Scale" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2a_relu" + type: "ReLU" + bottom: "res3a_branch2a" + top: "res3a_branch2a" + 
relu_param { + } +} +layer { + name: "res3a_branch2b" + type: "Convolution" + bottom: "res3a_branch2a" + top: "res3a_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 19.0499992371 + scale_out: 25.5400009155 + scale_params: 320.339996338 + } +} +layer { + name: "bn3a_branch2b" + type: "BatchNorm" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2b" + type: "Scale" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3a_branch2b_relu" + type: "ReLU" + bottom: "res3a_branch2b" + top: "res3a_branch2b" + relu_param { + } +} +layer { + name: "res3a_branch2c" + type: "Convolution" + bottom: "res3a_branch2b" + top: "res3a_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 25.5400009155 + scale_out: 4.65000009537 + scale_params: 65.7200012207 + } +} +layer { + name: "bn3a_branch2c" + type: "BatchNorm" + bottom: "res3a_branch2c" + top: "res3a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3a_branch2c" + type: "Scale" + bottom: "res3a_branch2c" + top: "res3a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3a" + type: "Eltwise" + bottom: "res3a_branch1" + bottom: "res3a_branch2c" + top: "res3a" + eltwise_param { + } +} +layer { + name: "res3a_relu" + type: "ReLU" + bottom: "res3a" + top: "res3a" + relu_param { + } +} +layer { + name: "res3b_branch2a" + type: 
"Convolution" + bottom: "res3a" + top: "res3b_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.32999992371 + scale_out: 24.1900005341 + scale_params: 493.920013428 + } +} +layer { + name: "bn3b_branch2a" + type: "BatchNorm" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2a" + type: "Scale" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3b_branch2a_relu" + type: "ReLU" + bottom: "res3b_branch2a" + top: "res3b_branch2a" + relu_param { + } +} +layer { + name: "res3b_branch2b" + type: "Convolution" + bottom: "res3b_branch2a" + top: "res3b_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 24.1900005341 + scale_out: 20.4899997711 + scale_params: 308.959991455 + } +} +layer { + name: "bn3b_branch2b" + type: "BatchNorm" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2b" + type: "Scale" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3b_branch2b_relu" + type: "ReLU" + bottom: "res3b_branch2b" + top: "res3b_branch2b" + relu_param { + } +} +layer { + name: "res3b_branch2c" + type: "Convolution" + bottom: "res3b_branch2b" + top: "res3b_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: 
"xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 20.4899997711 + scale_out: 4.65000009537 + scale_params: 55.6899986267 + } +} +layer { + name: "bn3b_branch2c" + type: "BatchNorm" + bottom: "res3b_branch2c" + top: "res3b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3b_branch2c" + type: "Scale" + bottom: "res3b_branch2c" + top: "res3b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3b" + type: "Eltwise" + bottom: "res3a" + bottom: "res3b_branch2c" + top: "res3b" + eltwise_param { + } +} +layer { + name: "res3b_relu" + type: "ReLU" + bottom: "res3b" + top: "res3b" + relu_param { + } +} +layer { + name: "res3c_branch2a" + type: "Convolution" + bottom: "res3b" + top: "res3c_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.32999992371 + scale_out: 9.35999965668 + scale_params: 142.929992676 + } +} +layer { + name: "bn3c_branch2a" + type: "BatchNorm" + bottom: "res3c_branch2a" + top: "res3c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2a" + type: "Scale" + bottom: "res3c_branch2a" + top: "res3c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3c_branch2a_relu" + type: "ReLU" + bottom: "res3c_branch2a" + top: "res3c_branch2a" + relu_param { + } +} +layer { + name: "res3c_branch2b" + type: "Convolution" + bottom: "res3c_branch2a" + top: "res3c_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + 
quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.35999965668 + scale_out: 3.70000004768 + scale_params: 88.1699981689 + } +} +layer { + name: "bn3c_branch2b" + type: "BatchNorm" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2b" + type: "Scale" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3c_branch2b_relu" + type: "ReLU" + bottom: "res3c_branch2b" + top: "res3c_branch2b" + relu_param { + } +} +layer { + name: "res3c_branch2c" + type: "Convolution" + bottom: "res3c_branch2b" + top: "res3c_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 3.70000004768 + scale_out: 4.65000009537 + scale_params: 66.2300033569 + } +} +layer { + name: "bn3c_branch2c" + type: "BatchNorm" + bottom: "res3c_branch2c" + top: "res3c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3c_branch2c" + type: "Scale" + bottom: "res3c_branch2c" + top: "res3c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3c" + type: "Eltwise" + bottom: "res3b" + bottom: "res3c_branch2c" + top: "res3c" + eltwise_param { + } +} +layer { + name: "res3c_relu" + type: "ReLU" + bottom: "res3c" + top: "res3c" + relu_param { + } +} +layer { + name: "res3c_p" + type: "Pooling" + bottom: "res3c" + top: "res3c_p" + pooling_param { + pool: MAX + kernel_size: 1 + stride: 2 + } +} +layer { + name: "res3d_branch2a" + type: "Convolution" + bottom: "res3c" + top: "res3d_branch2a" + convolution_param { + num_output: 128 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler 
{ + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.32999992371 + scale_out: 7.23000001907 + scale_params: 240.589996338 + } +} +layer { + name: "bn3d_branch2a" + type: "BatchNorm" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2a" + type: "Scale" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res3d_branch2a_relu" + type: "ReLU" + bottom: "res3d_branch2a" + top: "res3d_branch2a" + relu_param { + } +} +layer { + name: "res3d_branch2b" + type: "Convolution" + bottom: "res3d_branch2a" + top: "res3d_branch2b" + convolution_param { + num_output: 128 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 7.23000001907 + scale_out: 14.6999998093 + scale_params: 314.239990234 + } +} +layer { + name: "bn3d_branch2b" + type: "BatchNorm" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2b" + type: "Scale" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res3d_branch2b_relu" + type: "ReLU" + bottom: "res3d_branch2b" + top: "res3d_branch2b" + relu_param { + } +} +layer { + name: "res3d_branch2c" + type: "Convolution" + bottom: "res3d_branch2b" + top: "res3d_branch2c" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 14.6999998093 
+ scale_out: 4.88999986649 + scale_params: 113.980003357 + } +} +layer { + name: "bn3d_branch2c" + type: "BatchNorm" + bottom: "res3d_branch2c" + top: "res3d_branch2c" + batch_norm_param { + } +} +layer { + name: "scale3d_branch2c" + type: "Scale" + bottom: "res3d_branch2c" + top: "res3d_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res3d" + type: "Eltwise" + bottom: "res3c_p" + bottom: "res3d_branch2c" + top: "res3d" + eltwise_param { + } +} +layer { + name: "res3d_relu" + type: "ReLU" + bottom: "res3d" + top: "res3d" + relu_param { + } +} +layer { + name: "res4a_branch1" + type: "Convolution" + bottom: "res3d" + top: "res4a_branch1" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.82999992371 + scale_out: 4.28000020981 + scale_params: 213.380004883 + } +} +layer { + name: "bn4a_branch1" + type: "BatchNorm" + bottom: "res4a_branch1" + top: "res4a_branch1" + batch_norm_param { + } +} +layer { + name: "scale4a_branch1" + type: "Scale" + bottom: "res4a_branch1" + top: "res4a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2a" + type: "Convolution" + bottom: "res3d" + top: "res4a_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 9.82999992371 + scale_out: 12.3900003433 + scale_params: 254.339996338 + } +} +layer { + name: "bn4a_branch2a" + type: "BatchNorm" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4a_branch2a" 
+ type: "Scale" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2a_relu" + type: "ReLU" + bottom: "res4a_branch2a" + top: "res4a_branch2a" + relu_param { + } +} +layer { + name: "res4a_branch2b" + type: "Convolution" + bottom: "res4a_branch2a" + top: "res4a_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 12.3900003433 + scale_out: 14.8900003433 + scale_params: 473.709991455 + } +} +layer { + name: "bn4a_branch2b" + type: "BatchNorm" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4a_branch2b" + type: "Scale" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4a_branch2b_relu" + type: "ReLU" + bottom: "res4a_branch2b" + top: "res4a_branch2b" + relu_param { + } +} +layer { + name: "res4a_branch2c" + type: "Convolution" + bottom: "res4a_branch2b" + top: "res4a_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 14.8900003433 + scale_out: 4.28000020981 + scale_params: 75.6200027466 + } +} +layer { + name: "bn4a_branch2c" + type: "BatchNorm" + bottom: "res4a_branch2c" + top: "res4a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4a_branch2c" + type: "Scale" + bottom: "res4a_branch2c" + top: "res4a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4a" + type: "Eltwise" + bottom: "res4a_branch1" + 
bottom: "res4a_branch2c" + top: "res4a" + eltwise_param { + } +} +layer { + name: "res4a_relu" + type: "ReLU" + bottom: "res4a" + top: "res4a" + relu_param { + } +} +layer { + name: "res4b_branch2a" + type: "Convolution" + bottom: "res4a" + top: "res4b_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.60000038147 + scale_out: 12.0799999237 + scale_params: 325.369995117 + } +} +layer { + name: "bn4b_branch2a" + type: "BatchNorm" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2a" + type: "Scale" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4b_branch2a_relu" + type: "ReLU" + bottom: "res4b_branch2a" + top: "res4b_branch2a" + relu_param { + } +} +layer { + name: "res4b_branch2b" + type: "Convolution" + bottom: "res4b_branch2a" + top: "res4b_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 12.0799999237 + scale_out: 6.30999994278 + scale_params: 131.820007324 + } +} +layer { + name: "bn4b_branch2b" + type: "BatchNorm" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2b" + type: "Scale" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4b_branch2b_relu" + type: "ReLU" + bottom: "res4b_branch2b" + top: "res4b_branch2b" + relu_param { + } +} +layer { + name: 
"res4b_branch2c" + type: "Convolution" + bottom: "res4b_branch2b" + top: "res4b_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 6.30999994278 + scale_out: 4.28000020981 + scale_params: 67.4400024414 + } +} +layer { + name: "bn4b_branch2c" + type: "BatchNorm" + bottom: "res4b_branch2c" + top: "res4b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4b_branch2c" + type: "Scale" + bottom: "res4b_branch2c" + top: "res4b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4b" + type: "Eltwise" + bottom: "res4a" + bottom: "res4b_branch2c" + top: "res4b" + eltwise_param { + } +} +layer { + name: "res4b_relu" + type: "ReLU" + bottom: "res4b" + top: "res4b" + relu_param { + } +} +layer { + name: "res4c_branch2a" + type: "Convolution" + bottom: "res4b" + top: "res4c_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.60000038147 + scale_out: 11.4099998474 + scale_params: 369.480010986 + } +} +layer { + name: "bn4c_branch2a" + type: "BatchNorm" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2a" + type: "Scale" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4c_branch2a_relu" + type: "ReLU" + bottom: "res4c_branch2a" + top: "res4c_branch2a" + relu_param { + } +} +layer { + name: "res4c_branch2b" + type: "Convolution" + bottom: "res4c_branch2a" + top: "res4c_branch2b" 
+ convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 11.4099998474 + scale_out: 6.90999984741 + scale_params: 139.050003052 + } +} +layer { + name: "bn4c_branch2b" + type: "BatchNorm" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2b" + type: "Scale" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4c_branch2b_relu" + type: "ReLU" + bottom: "res4c_branch2b" + top: "res4c_branch2b" + relu_param { + } +} +layer { + name: "res4c_branch2c" + type: "Convolution" + bottom: "res4c_branch2b" + top: "res4c_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 6.90999984741 + scale_out: 4.28000020981 + scale_params: 76.9700012207 + } +} +layer { + name: "bn4c_branch2c" + type: "BatchNorm" + bottom: "res4c_branch2c" + top: "res4c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4c_branch2c" + type: "Scale" + bottom: "res4c_branch2c" + top: "res4c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4c" + type: "Eltwise" + bottom: "res4b" + bottom: "res4c_branch2c" + top: "res4c" + eltwise_param { + } +} +layer { + name: "res4c_relu" + type: "ReLU" + bottom: "res4c" + top: "res4c" + relu_param { + } +} +layer { + name: "res4d_branch2a" + type: "Convolution" + bottom: "res4c" + top: "res4d_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + 
stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.60000038147 + scale_out: 10.7299995422 + scale_params: 312.220001221 + } +} +layer { + name: "bn4d_branch2a" + type: "BatchNorm" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2a" + type: "Scale" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4d_branch2a_relu" + type: "ReLU" + bottom: "res4d_branch2a" + top: "res4d_branch2a" + relu_param { + } +} +layer { + name: "res4d_branch2b" + type: "Convolution" + bottom: "res4d_branch2a" + top: "res4d_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 10.7299995422 + scale_out: 5.40000009537 + scale_params: 201.61000061 + } +} +layer { + name: "bn4d_branch2b" + type: "BatchNorm" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2b" + type: "Scale" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4d_branch2b_relu" + type: "ReLU" + bottom: "res4d_branch2b" + top: "res4d_branch2b" + relu_param { + } +} +layer { + name: "res4d_branch2c" + type: "Convolution" + bottom: "res4d_branch2b" + top: "res4d_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + 
bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 5.40000009537 + scale_out: 4.28000020981 + scale_params: 77.1500015259 + } +} +layer { + name: "bn4d_branch2c" + type: "BatchNorm" + bottom: "res4d_branch2c" + top: "res4d_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4d_branch2c" + type: "Scale" + bottom: "res4d_branch2c" + top: "res4d_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4d" + type: "Eltwise" + bottom: "res4c" + bottom: "res4d_branch2c" + top: "res4d" + eltwise_param { + } +} +layer { + name: "res4d_relu" + type: "ReLU" + bottom: "res4d" + top: "res4d" + relu_param { + } +} +layer { + name: "res4e_branch2a" + type: "Convolution" + bottom: "res4d" + top: "res4e_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.60000038147 + scale_out: 11.75 + scale_params: 293.720001221 + } +} +layer { + name: "bn4e_branch2a" + type: "BatchNorm" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2a" + type: "Scale" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4e_branch2a_relu" + type: "ReLU" + bottom: "res4e_branch2a" + top: "res4e_branch2a" + relu_param { + } +} +layer { + name: "res4e_branch2b" + type: "Convolution" + bottom: "res4e_branch2a" + top: "res4e_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 11.75 + scale_out: 6.51999998093 + 
scale_params: 185.36000061 + } +} +layer { + name: "bn4e_branch2b" + type: "BatchNorm" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2b" + type: "Scale" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4e_branch2b_relu" + type: "ReLU" + bottom: "res4e_branch2b" + top: "res4e_branch2b" + relu_param { + } +} +layer { + name: "res4e_branch2c" + type: "Convolution" + bottom: "res4e_branch2b" + top: "res4e_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 6.51999998093 + scale_out: 4.28000020981 + scale_params: 98.8199996948 + } +} +layer { + name: "bn4e_branch2c" + type: "BatchNorm" + bottom: "res4e_branch2c" + top: "res4e_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4e_branch2c" + type: "Scale" + bottom: "res4e_branch2c" + top: "res4e_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4e" + type: "Eltwise" + bottom: "res4d" + bottom: "res4e_branch2c" + top: "res4e" + eltwise_param { + } +} +layer { + name: "res4e_relu" + type: "ReLU" + bottom: "res4e" + top: "res4e" + relu_param { + } +} +layer { + name: "res4e_p" + type: "Pooling" + bottom: "res4e" + top: "res4e_p" + pooling_param { + pool: MAX + kernel_size: 1 + stride: 2 + } +} +layer { + name: "res4f_branch2a" + type: "Convolution" + bottom: "res4e" + top: "res4f_branch2a" + convolution_param { + num_output: 256 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 
+ scale_in: 8.60000038147 + scale_out: 16.2900009155 + scale_params: 300.049987793 + } +} +layer { + name: "bn4f_branch2a" + type: "BatchNorm" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2a" + type: "Scale" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res4f_branch2a_relu" + type: "ReLU" + bottom: "res4f_branch2a" + top: "res4f_branch2a" + relu_param { + } +} +layer { + name: "res4f_branch2b" + type: "Convolution" + bottom: "res4f_branch2a" + top: "res4f_branch2b" + convolution_param { + num_output: 256 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 2 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 16.2900009155 + scale_out: 16.6200008392 + scale_params: 240.550003052 + } +} +layer { + name: "bn4f_branch2b" + type: "BatchNorm" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2b" + type: "Scale" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res4f_branch2b_relu" + type: "ReLU" + bottom: "res4f_branch2b" + top: "res4f_branch2b" + relu_param { + } +} +layer { + name: "res4f_branch2c" + type: "Convolution" + bottom: "res4f_branch2b" + top: "res4f_branch2c" + convolution_param { + num_output: 1024 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 16.6200008392 + scale_out: 4.23000001907 + scale_params: 93.3000030518 + } +} +layer { + name: "bn4f_branch2c" + type: "BatchNorm" + bottom: "res4f_branch2c" + top: 
"res4f_branch2c" + batch_norm_param { + } +} +layer { + name: "scale4f_branch2c" + type: "Scale" + bottom: "res4f_branch2c" + top: "res4f_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res4f" + type: "Eltwise" + bottom: "res4e_p" + bottom: "res4f_branch2c" + top: "res4f" + eltwise_param { + } +} +layer { + name: "res4f_relu" + type: "ReLU" + bottom: "res4f" + top: "res4f" + relu_param { + } +} +layer { + name: "res5a_branch1" + type: "Convolution" + bottom: "res4f" + top: "res5a_branch1" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.5 + scale_out: 0.939999997616 + scale_params: 45.0 + } +} +layer { + name: "bn5a_branch1" + type: "BatchNorm" + bottom: "res5a_branch1" + top: "res5a_branch1" + batch_norm_param { + } +} +layer { + name: "scale5a_branch1" + type: "Scale" + bottom: "res5a_branch1" + top: "res5a_branch1" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2a" + type: "Convolution" + bottom: "res4f" + top: "res5a_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 8.5 + scale_out: 21.5699996948 + scale_params: 375.869995117 + } +} +layer { + name: "bn5a_branch2a" + type: "BatchNorm" + bottom: "res5a_branch2a" + top: "res5a_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2a" + type: "Scale" + bottom: "res5a_branch2a" + top: "res5a_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2a_relu" + type: "ReLU" + bottom: 
"res5a_branch2a" + top: "res5a_branch2a" + relu_param { + } +} +layer { + name: "res5a_branch2b" + type: "Convolution" + bottom: "res5a_branch2a" + top: "res5a_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 21.5699996948 + scale_out: 25.2000007629 + scale_params: 228.160003662 + } +} +layer { + name: "bn5a_branch2b" + type: "BatchNorm" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2b" + type: "Scale" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5a_branch2b_relu" + type: "ReLU" + bottom: "res5a_branch2b" + top: "res5a_branch2b" + relu_param { + } +} +layer { + name: "res5a_branch2c" + type: "Convolution" + bottom: "res5a_branch2b" + top: "res5a_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 25.2000007629 + scale_out: 0.939999997616 + scale_params: 27.1299991608 + } +} +layer { + name: "bn5a_branch2c" + type: "BatchNorm" + bottom: "res5a_branch2c" + top: "res5a_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5a_branch2c" + type: "Scale" + bottom: "res5a_branch2c" + top: "res5a_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5a" + type: "Eltwise" + bottom: "res5a_branch1" + bottom: "res5a_branch2c" + top: "res5a" + eltwise_param { + } +} +layer { + name: "res5a_relu" + type: "ReLU" + bottom: "res5a" + top: "res5a" + relu_param { + } +} +layer { 
+ name: "res5b_branch2a" + type: "Convolution" + bottom: "res5a" + top: "res5b_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 1.87999999523 + scale_out: 25.4400005341 + scale_params: 999.760009766 + } +} +layer { + name: "bn5b_branch2a" + type: "BatchNorm" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2a" + type: "Scale" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5b_branch2a_relu" + type: "ReLU" + bottom: "res5b_branch2a" + top: "res5b_branch2a" + relu_param { + } +} +layer { + name: "res5b_branch2b" + type: "Convolution" + bottom: "res5b_branch2a" + top: "res5b_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 25.4400005341 + scale_out: 26.6200008392 + scale_params: 153.630004883 + } +} +layer { + name: "bn5b_branch2b" + type: "BatchNorm" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2b" + type: "Scale" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5b_branch2b_relu" + type: "ReLU" + bottom: "res5b_branch2b" + top: "res5b_branch2b" + relu_param { + } +} +layer { + name: "res5b_branch2c" + type: "Convolution" + bottom: "res5b_branch2b" + top: "res5b_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + 
stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 26.6200008392 + scale_out: 0.939999997616 + scale_params: 35.3400001526 + } +} +layer { + name: "bn5b_branch2c" + type: "BatchNorm" + bottom: "res5b_branch2c" + top: "res5b_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5b_branch2c" + type: "Scale" + bottom: "res5b_branch2c" + top: "res5b_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5b" + type: "Eltwise" + bottom: "res5a" + bottom: "res5b_branch2c" + top: "res5b" + eltwise_param { + } +} +layer { + name: "res5b_relu" + type: "ReLU" + bottom: "res5b" + top: "res5b" + relu_param { + } +} +layer { + name: "res5c_branch2a" + type: "Convolution" + bottom: "res5b" + top: "res5c_branch2a" + convolution_param { + num_output: 512 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 1.87999999523 + scale_out: 21.8099994659 + scale_params: 1013.09997559 + } +} +layer { + name: "bn5c_branch2a" + type: "BatchNorm" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2a" + type: "Scale" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + scale_param { + bias_term: true + } +} +layer { + name: "res5c_branch2a_relu" + type: "ReLU" + bottom: "res5c_branch2a" + top: "res5c_branch2a" + relu_param { + } +} +layer { + name: "res5c_branch2b" + type: "Convolution" + bottom: "res5c_branch2a" + top: "res5c_branch2b" + convolution_param { + num_output: 512 + bias_term: false + pad: 1 + kernel_size: 3 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + 
value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 21.8099994659 + scale_out: 14.7100000381 + scale_params: 321.25 + } +} +layer { + name: "bn5c_branch2b" + type: "BatchNorm" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2b" + type: "Scale" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + scale_param { + bias_term: true + } +} +layer { + name: "res5c_branch2b_relu" + type: "ReLU" + bottom: "res5c_branch2b" + top: "res5c_branch2b" + relu_param { + } +} +layer { + name: "res5c_branch2c" + type: "Convolution" + bottom: "res5c_branch2b" + top: "res5c_branch2c" + convolution_param { + num_output: 2048 + bias_term: false + pad: 0 + kernel_size: 1 + stride: 1 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.20000000298 + } + } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 14.7100000381 + scale_out: 0.939999997616 + scale_params: 23.2399997711 + } +} +layer { + name: "bn5c_branch2c" + type: "BatchNorm" + bottom: "res5c_branch2c" + top: "res5c_branch2c" + batch_norm_param { + } +} +layer { + name: "scale5c_branch2c" + type: "Scale" + bottom: "res5c_branch2c" + top: "res5c_branch2c" + scale_param { + bias_term: true + } +} +layer { + name: "res5c" + type: "Eltwise" + bottom: "res5b" + bottom: "res5c_branch2c" + top: "res5c" + eltwise_param { + } +} +layer { + name: "res5c_relu" + type: "ReLU" + bottom: "res5c" + top: "res5c" + relu_param { + } +} +layer { + name: "pool5" + type: "Pooling" + bottom: "res5c" + top: "pool5" + pooling_param { + pool: AVE + kernel_size: 7 + stride: 1 + } +} +layer { + name: "fc1000" + type: "InnerProduct" + bottom: "pool5" + top: "fc1000" + inner_product_param { + num_output: 1000 + weight_filler { + type: "xavier" + } + bias_filler { + type: "constant" + value: 0.0 + } + } +} 
+layer { + name: "prob" + type: "SoftmaxWithLoss" + bottom: "fc1000" + bottom: "label" + top: "prob" + include { + phase: TRAIN + } +} +layer { + name: "accuracy/top-1" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "accuracy-top1" + include { + phase: TEST + } +} +layer { + name: "accuracy/top-5" + type: "Accuracy" + bottom: "fc1000" + bottom: "label" + top: "accuracy-top5" + include { + phase: TEST + } + accuracy_param { + top_k: 5 + } +} diff --git a/models/intel_optimized_models/int8/ssd_int8.prototxt b/models/intel_optimized_models/int8/ssd_int8.prototxt index 583b1962f..26e1a28dc 100644 --- a/models/intel_optimized_models/int8/ssd_int8.prototxt +++ b/models/intel_optimized_models/int8/ssd_int8.prototxt @@ -39,12 +39,12 @@ layer { bottom: "data" top: "conv1_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 64 @@ -55,7 +55,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } } @@ -71,12 +71,12 @@ layer { bottom: "conv1_1" top: "conv1_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 64 @@ -87,7 +87,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -95,9 +95,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -2 - fl_layer_out: -4 - fl_params: 8 + scale_in: 0.319999992847 + scale_out: 0.0799999982119 + scale_params: 454.859985352 } } layer { @@ -123,12 +123,12 @@ layer { bottom: "pool1" top: "conv2_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 128 @@ -139,7 +139,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -147,9 +147,9 @@ 
layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -4 - fl_layer_out: -5 - fl_params: 8 + scale_in: 0.0799999982119 + scale_out: 0.0599999986589 + scale_params: 299.019989014 } } layer { @@ -164,12 +164,12 @@ layer { bottom: "conv2_1" top: "conv2_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 128 @@ -180,7 +180,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -188,9 +188,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -5 - fl_layer_out: -5 - fl_params: 9 + scale_in: 0.0599999986589 + scale_out: 0.0500000007451 + scale_params: 540.909973145 } } layer { @@ -216,12 +216,12 @@ layer { bottom: "pool2" top: "conv3_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -232,7 +232,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -240,9 +240,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -5 - fl_layer_out: -5 - fl_params: 8 + scale_in: 0.0500000007451 + scale_out: 0.0399999991059 + scale_params: 256.5 } } layer { @@ -257,12 +257,12 @@ layer { bottom: "conv3_1" top: "conv3_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -273,7 +273,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -281,9 +281,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -5 - fl_layer_out: -5 - fl_params: 8 + scale_in: 0.0399999991059 + scale_out: 0.0500000007451 + scale_params: 306.799987793 } } layer { @@ -298,12 +298,12 @@ layer { bottom: "conv3_2" top: "conv3_3" param { - 
lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -314,7 +314,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -322,9 +322,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -5 - fl_layer_out: -5 - fl_params: 8 + scale_in: 0.0500000007451 + scale_out: 0.0599999986589 + scale_params: 352.630004883 } } layer { @@ -350,12 +350,12 @@ layer { bottom: "pool3" top: "conv4_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -366,7 +366,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -374,9 +374,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -5 - fl_layer_out: -4 - fl_params: 8 + scale_in: 0.0599999986589 + scale_out: 0.0799999982119 + scale_params: 478.589996338 } } layer { @@ -391,12 +391,12 @@ layer { bottom: "conv4_1" top: "conv4_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -407,7 +407,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -415,9 +415,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -4 - fl_layer_out: -3 - fl_params: 8 + scale_in: 0.0799999982119 + scale_out: 0.180000007153 + scale_params: 485.910003662 } } layer { @@ -432,12 +432,12 @@ layer { bottom: "conv4_2" top: "conv4_3" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -448,7 +448,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } 
quantization_param { @@ -456,9 +456,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -3 - fl_layer_out: -2 - fl_params: 9 + scale_in: 0.180000007153 + scale_out: 0.40000000596 + scale_params: 552.33001709 } } layer { @@ -484,12 +484,12 @@ layer { bottom: "pool4" top: "conv5_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -500,7 +500,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } dilation: 1 } @@ -509,9 +509,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -2 - fl_layer_out: -1 - fl_params: 9 + scale_in: 0.40000000596 + scale_out: 0.550000011921 + scale_params: 766.260009766 } } layer { @@ -526,12 +526,12 @@ layer { bottom: "conv5_1" top: "conv5_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -542,7 +542,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } dilation: 1 } @@ -551,9 +551,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: -1 - fl_layer_out: 0 - fl_params: 9 + scale_in: 0.550000011921 + scale_out: 1.16999995708 + scale_params: 838.429992676 } } layer { @@ -568,12 +568,12 @@ layer { bottom: "conv5_2" top: "conv5_3" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -584,7 +584,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } dilation: 1 } @@ -593,9 +593,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 0 - fl_layer_out: 0 - fl_params: 9 + scale_in: 1.16999995708 + scale_out: 1.78999996185 + scale_params: 717.200012207 } } layer { @@ -622,12 +622,12 @@ layer { bottom: "pool5" top: "fc6" param { - 
lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 1024 @@ -638,9 +638,8 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } - engine: CAFFE dilation: 6 } quantization_param { @@ -648,9 +647,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 0 - fl_layer_out: 2 - fl_params: 9 + scale_in: 1.78999996185 + scale_out: 5.80999994278 + scale_params: 581.219970703 } } layer { @@ -665,12 +664,12 @@ layer { bottom: "fc6" top: "fc7" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 1024 @@ -680,7 +679,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -688,9 +687,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 2 - fl_layer_out: 4 - fl_params: 9 + scale_in: 5.80999994278 + scale_out: 23.5200004578 + scale_params: 937.08001709 } } layer { @@ -705,12 +704,12 @@ layer { bottom: "fc7" top: "conv6_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -722,7 +721,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -730,9 +729,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 5 - fl_params: 9 + scale_in: 23.5200004578 + scale_out: 41.3400001526 + scale_params: 590.469970703 } } layer { @@ -747,12 +746,12 @@ layer { bottom: "conv6_1" top: "conv6_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 512 @@ -764,7 +763,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } 
quantization_param { @@ -772,9 +771,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 5 - fl_layer_out: 5 - fl_params: 10 + scale_in: 41.3400001526 + scale_out: 32.3899993896 + scale_params: 1789.36999512 } } layer { @@ -789,12 +788,12 @@ layer { bottom: "conv6_2" top: "conv7_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 128 @@ -806,7 +805,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -814,9 +813,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 5 - fl_layer_out: 4 - fl_params: 9 + scale_in: 32.3899993896 + scale_out: 20.6700000763 + scale_params: 882.909973145 } } layer { @@ -831,12 +830,12 @@ layer { bottom: "conv7_1" top: "conv7_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -848,7 +847,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -856,9 +855,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 10 + scale_in: 20.6700000763 + scale_out: 14.25 + scale_params: 1246.82995605 } } layer { @@ -873,12 +872,12 @@ layer { bottom: "conv7_2" top: "conv8_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 128 @@ -890,7 +889,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -898,9 +897,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 4 - fl_params: 9 + scale_in: 14.25 + scale_out: 18.6299991608 + scale_params: 646.679992676 } } layer { @@ -915,12 +914,12 @@ layer { bottom: "conv8_1" top: "conv8_2" 
param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -932,7 +931,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -940,9 +939,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 10 + scale_in: 18.6299991608 + scale_out: 18.4300003052 + scale_params: 1516.22998047 } } layer { @@ -957,12 +956,12 @@ layer { bottom: "conv8_2" top: "conv9_1" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 128 @@ -974,7 +973,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -982,9 +981,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 4 - fl_params: 9 + scale_in: 18.4300003052 + scale_out: 16.2800006866 + scale_params: 864.780029297 } } layer { @@ -999,12 +998,12 @@ layer { bottom: "conv9_1" top: "conv9_2" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 256 @@ -1016,7 +1015,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -1024,9 +1023,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 3 - fl_params: 10 + scale_in: 16.2800006866 + scale_out: 10.6199998856 + scale_params: 1733.91003418 } } layer { @@ -1044,7 +1043,7 @@ layer { across_spatial: false scale_filler { type: "constant" - value: 20 + value: 20.0 } channel_shared: false } @@ -1055,12 +1054,12 @@ layer { bottom: "conv4_3_norm" top: "conv4_3_norm_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + 
decay_mult: 0.0 } convolution_param { num_output: 16 @@ -1072,9 +1071,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 22.3600006104 + scale_out: 9.88000011444 + scale_params: 247.979995728 + } } layer { name: "conv4_3_norm_mbox_loc_perm" @@ -1103,12 +1111,12 @@ layer { bottom: "conv4_3_norm" top: "conv4_3_norm_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 84 @@ -1120,9 +1128,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 22.3600006104 + scale_out: 9.13000011444 + scale_params: 793.659973145 + } } layer { name: "conv4_3_norm_mbox_conf_perm" @@ -1152,16 +1169,16 @@ layer { bottom: "data" top: "conv4_3_norm_mbox_priorbox" prior_box_param { - min_size: 30 - max_size: 60 - aspect_ratio: 2 + min_size: 30.0 + max_size: 60.0 + aspect_ratio: 2.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 8 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 8.0 offset: 0.5 } } @@ -1171,12 +1188,12 @@ layer { bottom: "fc7" top: "fc7_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 24 @@ -1188,9 +1205,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 23.5200004578 + scale_out: 28.1800003052 + scale_params: 1580.34997559 + } } layer { name: "fc7_mbox_loc_perm" @@ -1219,12 +1245,12 @@ 
layer { bottom: "fc7" top: "fc7_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 126 @@ -1236,9 +1262,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 23.5200004578 + scale_out: 4.11999988556 + scale_params: 975.270019531 + } } layer { name: "fc7_mbox_conf_perm" @@ -1268,17 +1303,17 @@ layer { bottom: "data" top: "fc7_mbox_priorbox" prior_box_param { - min_size: 60 - max_size: 111 - aspect_ratio: 2 - aspect_ratio: 3 + min_size: 60.0 + max_size: 111.0 + aspect_ratio: 2.0 + aspect_ratio: 3.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 16 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 16.0 offset: 0.5 } } @@ -1288,12 +1323,12 @@ layer { bottom: "conv6_2" top: "conv6_2_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 24 @@ -1305,9 +1340,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 32.3899993896 + scale_out: 30.3400001526 + scale_params: 1448.85998535 + } } layer { name: "conv6_2_mbox_loc_perm" @@ -1336,12 +1380,12 @@ layer { bottom: "conv6_2" top: "conv6_2_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 126 @@ -1353,9 +1397,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + 
bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 32.3899993896 + scale_out: 4.40999984741 + scale_params: 886.849975586 + } } layer { name: "conv6_2_mbox_conf_perm" @@ -1385,17 +1438,17 @@ layer { bottom: "data" top: "conv6_2_mbox_priorbox" prior_box_param { - min_size: 111 - max_size: 162 - aspect_ratio: 2 - aspect_ratio: 3 + min_size: 111.0 + max_size: 162.0 + aspect_ratio: 2.0 + aspect_ratio: 3.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 32 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 32.0 offset: 0.5 } } @@ -1405,12 +1458,12 @@ layer { bottom: "conv7_2" top: "conv7_2_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 24 @@ -1422,9 +1475,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 14.25 + scale_out: 26.8600006104 + scale_params: 1228.0300293 + } } layer { name: "conv7_2_mbox_loc_perm" @@ -1453,12 +1515,12 @@ layer { bottom: "conv7_2" top: "conv7_2_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 126 @@ -1470,9 +1532,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 14.25 + scale_out: 4.65999984741 + scale_params: 896.140014648 + } } layer { name: "conv7_2_mbox_conf_perm" @@ -1502,17 +1573,17 @@ layer { bottom: "data" top: "conv7_2_mbox_priorbox" prior_box_param { - min_size: 162 - max_size: 213 - aspect_ratio: 2 - aspect_ratio: 3 + min_size: 162.0 + max_size: 213.0 + 
aspect_ratio: 2.0 + aspect_ratio: 3.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 64 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 64.0 offset: 0.5 } } @@ -1522,12 +1593,12 @@ layer { bottom: "conv8_2" top: "conv8_2_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 16 @@ -1539,7 +1610,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -1547,9 +1618,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 4 - fl_layer_out: 5 - fl_params: 10 + scale_in: 18.4300003052 + scale_out: 26.6599998474 + scale_params: 1359.68994141 } } layer { @@ -1579,12 +1650,12 @@ layer { bottom: "conv8_2" top: "conv8_2_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 84 @@ -1596,9 +1667,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 18.4300003052 + scale_out: 5.67999982834 + scale_params: 1086.95996094 + } } layer { name: "conv8_2_mbox_conf_perm" @@ -1628,16 +1708,16 @@ layer { bottom: "data" top: "conv8_2_mbox_priorbox" prior_box_param { - min_size: 213 - max_size: 264 - aspect_ratio: 2 + min_size: 213.0 + max_size: 264.0 + aspect_ratio: 2.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 100 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 100.0 offset: 0.5 } } @@ -1647,12 +1727,12 @@ layer { bottom: "conv9_2" top: "conv9_2_mbox_loc" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + 
decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 16 @@ -1664,7 +1744,7 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } quantization_param { @@ -1672,9 +1752,9 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - fl_layer_in: 3 - fl_layer_out: 6 - fl_params: 10 + scale_in: 10.6199998856 + scale_out: 35.0900001526 + scale_params: 1117.32995605 } } layer { @@ -1704,12 +1784,12 @@ layer { bottom: "conv9_2" top: "conv9_2_mbox_conf" param { - lr_mult: 1 - decay_mult: 1 + lr_mult: 1.0 + decay_mult: 1.0 } param { - lr_mult: 2 - decay_mult: 0 + lr_mult: 2.0 + decay_mult: 0.0 } convolution_param { num_output: 84 @@ -1721,9 +1801,18 @@ layer { } bias_filler { type: "constant" - value: 0 + value: 0.0 } } + quantization_param { + precision: DYNAMIC_FIXED_POINT + bw_layer_in: 8 + bw_layer_out: 8 + bw_params: 8 + scale_in: 10.6199998856 + scale_out: 5.92000007629 + scale_params: 539.520019531 + } } layer { name: "conv9_2_mbox_conf_perm" @@ -1753,16 +1842,16 @@ layer { bottom: "data" top: "conv9_2_mbox_priorbox" prior_box_param { - min_size: 264 - max_size: 315 - aspect_ratio: 2 + min_size: 264.0 + max_size: 315.0 + aspect_ratio: 2.0 flip: true clip: false - variance: 0.1 - variance: 0.1 - variance: 0.2 - variance: 0.2 - step: 300 + variance: 0.10000000149 + variance: 0.10000000149 + variance: 0.20000000298 + variance: 0.20000000298 + step: 300.0 offset: 0.5 } } @@ -1818,7 +1907,7 @@ layer { dim: 0 dim: -1 dim: 21 - } + } } } layer { @@ -1854,11 +1943,36 @@ layer { share_location: true background_label_id: 0 nms_param { - nms_threshold: 0.45 + nms_threshold: 0.449999988079 top_k: 400 } + save_output_param { + output_directory: "data/ssd_out/VOC2007/SSD_300x300" + output_name_prefix: "comp4_det_test_" + output_format: "VOC" + label_map_file: "data/VOC0712/labelmap_voc.prototxt" + name_size_file: "data/VOC0712/test_name_size.txt" + num_test_image: 4952 + } code_type: CENTER_SIZE 
keep_top_k: 200 - confidence_threshold: 0.01 + confidence_threshold: 0.00999999977648 + } +} +layer { + name: "detection_eval" + type: "DetectionEvaluate" + bottom: "detection_out" + bottom: "label" + top: "detection_eval" + include { + phase: TEST + } + detection_evaluate_param { + num_classes: 21 + background_label_id: 0 + overlap_threshold: 0.5 + evaluate_difficult_gt: false + name_size_file: "data/VOC0712/test_name_size.txt" } } From 29eec8cdbe5725ed1a5a3dec21fbf903b74e2108 Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Sun, 7 Jan 2018 23:38:31 +0800 Subject: [PATCH 47/53] Fix for ICL-370, the root cause is we need to check the bottom blob is prv or cpu firstly. --- src/caffe/layers/mkldnn_convolution_layer.cpp | 16 +++++++++------- 1 file changed, 9 insertions(+), 7 deletions(-) diff --git a/src/caffe/layers/mkldnn_convolution_layer.cpp b/src/caffe/layers/mkldnn_convolution_layer.cpp index 9380afe32..d3f462998 100644 --- a/src/caffe/layers/mkldnn_convolution_layer.cpp +++ b/src/caffe/layers/mkldnn_convolution_layer.cpp @@ -207,15 +207,17 @@ void MKLDNNConvolutionLayer::InitConvolutionFwd(const vector* bool is_sum; if (bottom.size() > 1) { is_sum = true; - shared_ptr > bottom_0_desc = - get_mkldnn_prv_descriptor(bottom[0]); - shared_ptr > bottom_1_desc = - get_mkldnn_prv_descriptor(bottom[1]); + memory::data_type bottom_1_dt = memory::data_type::f32; + if (const_cast(bottom[1]->prv_data()) != NULL){ + + shared_ptr > bottom_1_desc = + get_mkldnn_prv_descriptor(bottom[1]); + bottom_1_dt = static_cast(bottom_1_desc->prv_memory_pd()->desc().data.data_type); + } - if (top_dt != bottom_1_desc->prv_memory_pd()->desc().data.data_type) { - top_dt = static_cast( - bottom_1_desc->prv_memory_pd()->desc().data.data_type); + if (top_dt != bottom_1_dt) { + top_dt = bottom_1_dt; } } From 69b63e7a6bfc3ea3fb4f30b82efed5d9e19cdddd Mon Sep 17 00:00:00 2001 From: "Tian, Feng" Date: Wed, 10 Jan 2018 11:41:42 +0800 Subject: [PATCH 48/53] update caffe version to 1.1.0 --- 
CMakeLists.txt | 4 ++-- Makefile | 4 ++-- docker/README.md | 2 +- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/CMakeLists.txt b/CMakeLists.txt index 8ab712cf7..9c3253ba5 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -10,8 +10,8 @@ endif() project(Caffe C CXX) # ---[ Caffe version -set(CAFFE_TARGET_VERSION "1.0.0-rc3" CACHE STRING "Caffe logical version") -set(CAFFE_TARGET_SOVERSION "1.0.0-rc3" CACHE STRING "Caffe soname version") +set(CAFFE_TARGET_VERSION "1.1.0" CACHE STRING "Caffe logical version") +set(CAFFE_TARGET_SOVERSION "1.1.0" CACHE STRING "Caffe soname version") add_definitions(-DCAFFE_VERSION=${CAFFE_TARGET_VERSION}) # ---[ Using cmake scripts and modules diff --git a/Makefile b/Makefile index f0eb4c71f..5e9d16ad5 100644 --- a/Makefile +++ b/Makefile @@ -101,8 +101,8 @@ LIBRARY_NAME := $(PROJECT) LIB_BUILD_DIR := $(BUILD_DIR)/lib STATIC_NAME := $(LIB_BUILD_DIR)/lib$(LIBRARY_NAME).a DYNAMIC_VERSION_MAJOR := 1 -DYNAMIC_VERSION_MINOR := 0 -DYNAMIC_VERSION_REVISION := 0-rc3 +DYNAMIC_VERSION_MINOR := 1 +DYNAMIC_VERSION_REVISION := 0 DYNAMIC_NAME_SHORT := lib$(LIBRARY_NAME).so #DYNAMIC_SONAME_SHORT := $(DYNAMIC_NAME_SHORT).$(DYNAMIC_VERSION_MAJOR) DYNAMIC_VERSIONED_NAME_SHORT := $(DYNAMIC_NAME_SHORT).$(DYNAMIC_VERSION_MAJOR).$(DYNAMIC_VERSION_MINOR).$(DYNAMIC_VERSION_REVISION) diff --git a/docker/README.md b/docker/README.md index adb893282..f945feabb 100644 --- a/docker/README.md +++ b/docker/README.md @@ -17,7 +17,7 @@ docker run -ti caffe:cpu caffe --version ``` which should show a message like: ``` -caffe version 1.0.0-rc3 +caffe version 1.1.0 ``` One can also build and run the Caffe tests in the image using: From fee2e024c394c7d931de25144ccead4562e05d1b Mon Sep 17 00:00:00 2001 From: "Zhang, Guoming" Date: Thu, 11 Jan 2018 07:51:44 +0800 Subject: [PATCH 49/53] Enhance the accuracy calibration tool with below enhancement and fixing. 1.Fixed the unless reorder that raised on resnet and inceptionv3. 
2.Optimized the parameters for general topology usage. 3.Updated the help message for this tool, for the detail usage, please refer to https://github.com/intel/caffe/wiki/Introduction-of-Accuracy-Calibration-Tool-for-8-Bit-Inference --- scripts/calibrator.py | 218 +++++++++++++++++++++++++++--------------- 1 file changed, 143 insertions(+), 75 deletions(-) diff --git a/scripts/calibrator.py b/scripts/calibrator.py index 7dcb7c54a..4bda3bb8d 100644 --- a/scripts/calibrator.py +++ b/scripts/calibrator.py @@ -64,23 +64,21 @@ def read_prototxt(prototxt): try: if not check_existence(prototxt): return None - net = caffe_pb2.NetParameter() - with open(prototxt) as f: txtf.Merge(f.read(), net) return net except Exception as e: - raise ("Failed to read {} due to {}".format(prototxt, str(e))) + print ("Failed to read {} due to {}".format(prototxt, e)) -def get_bottom_layers(layer_name, net, start): +def get_bottom_layers(top_name, net, start): bottom_layers = [] for index, value in enumerate(net.layer[start:]): for sub_index, sub_value in enumerate(value.bottom): - if sub_value == layer_name: + if sub_value == top_name: bottom_layers.append((index, value.name, value.type)) return bottom_layers @@ -123,9 +121,9 @@ def get_all_top_layers(l, net, end, skip_layers, interesting_layers): return all_top_layers -def get_all_bottom_layers(layer_name, net, start, skip_layers, interesting_layers): +def get_all_bottom_layers(top_name, net, start, skip_layers, interesting_layers): all_bottom_layers = [] - bottom_layers = get_bottom_layers(layer_name, net, start) + bottom_layers = get_bottom_layers(top_name, net, start) while True: if len(bottom_layers) == 0: break @@ -149,12 +147,48 @@ def get_all_bottom_layers(layer_name, net, start, skip_layers, interesting_layer return all_bottom_layers -def transform_convolutions(model_path): +def get_fusion_conv_names(compiled_model): + compiled_net = caffe_pb2.NetParameter() + with open(compiled_model) as f: + s = f.read() + txtf.Merge(s, 
compiled_net) + return [(layer.name, layer.bottom[1]) for _, layer in enumerate(compiled_net.layer) + if layer.type == 'Convolution' and len(layer.bottom) > 1] + + +def filter_fusion_layers(net, fusion_layer, conv_layer): + if not fusion_layer or not conv_layer: + return [] + interesting_layers = ['ReLU'] + skip_layers = ['Convolution', 'Eltwise', 'Concat'] + output_with_relu_layer = [(l.name, net.layer[index].top[0]) for l, index in conv_layer + if len(get_all_bottom_layers(net.layer[index].top[0], net, index + 1, + skip_layers, interesting_layers)) == 0] + output_without_dict = {v: k for (k, v) in output_with_relu_layer} + for layer_name, top_name in fusion_layer: + if top_name in output_without_dict.keys(): + del output_without_dict[top_name] + + return output_without_dict.values() + + +def check_relu_existence(net, start, end, exclude_layer): + if net.layer[start].type == 'Convolution' and net.layer[start].name in exclude_layer: + return False + + for i in net.layer[start + 1: end]: + if i.type == 'ReLU': + return True + return False + + +def transform_convolutions(model_path, compiled_model_path): net = caffe_pb2.NetParameter() with open(model_path) as f: s = f.read() txtf.Merge(s, net) + fusion_layer = get_fusion_conv_names(compiled_model_path) new_net = copy.deepcopy(net) convolution_layers = [(value, index) for index, value in enumerate(net.layer) if value.type == 'Convolution'] @@ -164,17 +198,18 @@ def transform_convolutions(model_path): u8_max = 255 s8_max = 127 - + u8_layers = filter_fusion_layers(net, fusion_layer, convolution_layers) for (l, index) in convolution_layers: - outputwith_relu = get_all_bottom_layers(l.name, net, index + 1, skip_layers, interesting_layers) + outputwith_relu = get_all_bottom_layers(net.layer[index].top[0], net, index + 1, skip_layers, + interesting_layers) + conv_relu_flag = check_relu_existence(net, index, + convolution_layers[convolution_layers.index((l, index)) + 1][1] + if (l, index) != convolution_layers[-1] + else 
len(net.layer), [i[0] for i in fusion_layer]) inputwith_relu = get_all_top_layers(l, net, index, skip_layers, interesting_layers) - # print "Processing", l.type, l.name - - # output_type = 'u8' if outputwith_relu else 's8' - # input_type = 'u8' if inputwith_relu else 's8' for si in range(0, len(new_net.layer[index].quantization_param.scale_out)): - if len(outputwith_relu) > 0: # u8 + if len(outputwith_relu) > 0 or l.name in u8_layers or conv_relu_flag: # u8 new_net.layer[index].quantization_param.scale_out[si] = round(u8_max / new_net.layer[index]. quantization_param.scale_out[si], 2) else: # s8 @@ -182,12 +217,12 @@ def transform_convolutions(model_path): quantization_param.scale_out[si], 2) for si in range(0, len(new_net.layer[index].quantization_param.scale_in)): - if len(inputwith_relu) > 0: # u8 + if len(inputwith_relu) > 0 or l.type == 'Convolution': # u8 new_net.layer[index].quantization_param.scale_in[si] = round(u8_max / new_net.layer[index]. quantization_param.scale_in[si], 2) - else: # s8 - new_net.layer[index].quantization_param.scale_in[si] = round(s8_max / new_net.layer[index]. - quantization_param.scale_in[si], 2) + else: + new_net.layer[index].ClearField('quantization_param') + continue for si in range(0, len(new_net.layer[index].quantization_param.scale_params)): new_net.layer[index].quantization_param.scale_params[si] = round(s8_max / new_net.layer[index]. 
@@ -198,39 +233,51 @@ def transform_convolutions(model_path): def generate_sample(sample_path, input_model, weights, - quantized_model, model_type, iterations=1, error_margin=1, power=0): + quantized_model, detection, iterations=1, error_margin=1, power=0): cmd = '{0} quantize -model {1} -weights {2} -model_quantized {3} -iterations {4} ' \ '-trimming_mode dynamic_fixed_point -error_margin {5} -power {6}'.format(sample_path, input_model, weights, quantized_model, iterations, error_margin, power) - if model_type == 3: + if detection: cmd += ' --detection=1' os.system(cmd) -def get_the_accuracy(caffe_bin, model_def, model_weights, iterations, model_type): +def get_compiled_net(caffe_bin, model_def, model_weights, detection): + output_log_name = '.compiled_net.txt' + + cmd = '{} test -model {} -weights {} -iterations 1'.format(caffe_bin, model_def, model_weights) + if detection: + cmd += ' -detection' + cmd += ' 2>&1 > {}'.format(output_log_name) + + os.system(cmd) + return os.path.abspath(output_log_name) + + +def get_the_accuracy(caffe_bin, model_def, model_weights, iterations, detection, blob_name): output_log_name = 'calibrator_log.txt' cmd = '{} test -model {} -weights {} -iterations {}'.format(caffe_bin, model_def, model_weights, iterations) - if model_type == 3: + if detection: cmd += ' -detection' cmd += ' 2>&1|tee {}'.format(output_log_name) + os.system(cmd) + with open(output_log_name) as f: data = f.readlines() - try: - if model_type == 1: - top_1 = data[-2].strip() - return float(top_1.split('=')[-1].strip()) - elif model_type == 2: - top_1 = data[-3].strip() - return float(top_1.split('=')[-1].strip()) - elif model_type == 3: - top_1 = data[-1].strip() - return float(top_1.split('=')[-1].strip()) - except Exception as e: - print 'Failed to generate accuracy due to {}'.format(str(e)) - sys.exit(-1) + + for i in data[::-1]: + if i.find('{} = '.format(blob_name)) != -1: + try: + return float(i.split('=')[-1].strip()) + except Exception as e: + print 'Failed 
to generate accuracy due to {}'.format(str(e)) + sys.exit(-1) + + print 'Failed to get accuracy, please check the parameters and rerun the scripts.' + sys.exit(-1) def remove_top_quantized_parameter(current_quantized_file): @@ -244,17 +291,33 @@ def remove_top_quantized_parameter(current_quantized_file): f.write(str(net)) -def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, model_weights, iterations, - enable_floating_point, toleration, model_type): - if enable_floating_point == 0: +def tuning_quantized_topology(base_top1_accuracy, prototxt, caffe_bin, model_weights, iterations, + is_floating_point, accuracy_loss, detection, blob_name): + if is_floating_point == 0: print 'Updating quantization parameter...' - transform_convolutions(quantized_file) - current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_file, model_weights, iterations, model_type) - while abs(current_top1_accuracy - base_top1_accuracy) >= toleration: + + transform_convolutions(prototxt, get_compiled_net(caffe_bin, prototxt, model_weights, detection)) + + current_top1_accuracy = get_the_accuracy(caffe_bin, prototxt, model_weights, iterations, detection, blob_name) + + while abs(current_top1_accuracy - base_top1_accuracy) >= accuracy_loss: print 'Tuning... ' print abs(current_top1_accuracy - base_top1_accuracy) - remove_top_quantized_parameter(quantized_file) - current_top1_accuracy = get_the_accuracy(caffe_bin, quantized_prototxt, model_weights, iterations, model_type) + remove_top_quantized_parameter(prototxt) + current_top1_accuracy = get_the_accuracy(caffe_bin, prototxt, model_weights, iterations, detection, blob_name) + + +def check_blob_name_existence(prototxt, blob_name): + net = read_prototxt(prototxt) + if not net.layer: + print 'Please check the model prototxt integrity.' 
+ sys.exit(-1) + + for i in net.layer[::-1]: + for _, value in enumerate(i.top): + if value == blob_name: + return True + return False if __name__ == '__main__': @@ -265,36 +328,41 @@ def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, mod ' -w pre-trained-fp32 weights ' \ ' -m typology ' \ ' -i iterations ' \ - ' -t resnet|inceptionv3|ssd\n ' + ' -l acceptable accuracy loss value, the default value is 0.01(stands for 1%)' \ + ' -d 1(0 means classification while 1 means detection, the default value is 0' \ + ' -n blob name which means accuracy.\n ' parser = argparse.ArgumentParser(add_help=False) parser.add_argument('-h', '--help', action='help', help=usage_string) parser.add_argument('-i', '--iterations', action='store', dest='iterations', default=10, - help='iterations') + help='equal to the number to complete one epoch.') parser.add_argument('-w', '--weights', action='store', dest='weights', default='', - help='pre-trained-fp32-weights') + help='pre-trained-fp32-weights.') parser.add_argument('-m', '--model', action='store', dest='model', default='', - help='model') + help='topology definition prototxt.') parser.add_argument('-l', '--accuracy_loss', action='store', dest='loss', default=0.01, - help='accuracy-loss') + help='the acceptable accuracy loss that raised by 8-Bit quantization, ' + 'default value is 0.01(1%).') - parser.add_argument('-t', '--type', action='store', dest='input_model_type', default='', - help='model type') + parser.add_argument('-d', '--detection', action='store', dest='is_detection', default=0, + help='0 for classification while 1 for detection, default value is 0.') parser.add_argument('-r', '--root', action='store', dest='root', default='', help='caffe build path') - + + parser.add_argument('-n', '--blob_name', action='store', dest='blob_name', default='', + help='top blob name which stands for accuracy') params = parser.parse_args() try: - iterations = int(params.iterations) + user_input_iterations = 
int(params.iterations) except: print 'Set the iterations to the default value 1000' - iterations = 1000 + user_input_iterations = 1000 try: toleration = float(params.loss) @@ -304,41 +372,41 @@ def tuning_quantized_topology(base_top1_accuracy, quantized_file, caffe_bin, mod print 'Set the toleration to 1%.' toleration = 0.01 + try: + detection_flag = 1 if int(params.is_detection) == 1 else 0 + except: + print 'Set the test type to classification.' + detection_flag = 0 + model = os.path.abspath(params.model) - weights = os.path.abspath(params.weights) + user_input_weights = os.path.abspath(params.weights) sample = os.path.abspath(params.root + 'tools/sample') - caffe_bin = os.path.abspath(params.root + 'tools/caffe') + caffe_bin_path = os.path.abspath(params.root + 'tools/caffe') setup_env() - if params.input_model_type == 'resnet': - model_type = 1 - elif params.input_model_type == 'inceptionv3': - model_type = 2 - elif params.input_model_type == 'ssd': - model_type = 3 - else: - print 'Invalid model type!' + if not check_existence(model) or not check_existence(user_input_weights) or not check_existence(sample) \ + or not check_existence(caffe_bin_path): + print 'Please check model/weights/sample existence.' sys.exit(-1) - if check_existence(model) is False or check_existence(weights) is False or check_existence(sample) is False or \ - check_existence(caffe_bin) is False: - print 'Please check model/weights/sample existence.' + target_blob_name = params.blob_name + if not target_blob_name or not check_blob_name_existence(model, target_blob_name): + print 'Please specify valid blob name and rerun the script.' sys.exit(-1) sys.path.insert(0, params.root + '../python') quantized_prototxt = model.rsplit('.')[0] + '_quantized.prototxt' - quantized_weights = weights.rsplit('.')[0] + '_quantized.caffemodel' + quantized_weights = user_input_weights.rsplit('.')[0] + '_quantized.caffemodel' enable_floating_point = 0 print 'Sampling...' 
- generate_sample(sample, model, weights, - quantized_prototxt, model_type, 10, 100 * toleration, enable_floating_point) - + generate_sample(sample, model, user_input_weights, + quantized_prototxt, detection_flag, 10, 100 * toleration, enable_floating_point) print 'Sampling done' print 'Generating the FP32 accuracy...' - top_1 = get_the_accuracy(caffe_bin, model, weights, iterations, model_type) + top_1 = get_the_accuracy(caffe_bin_path, model, user_input_weights, user_input_iterations, detection_flag, + target_blob_name) print 'FP32 accuracy is: {}'.format(top_1) - - tuning_quantized_topology(top_1, quantized_prototxt, caffe_bin, weights, iterations, enable_floating_point, - toleration, model_type) + tuning_quantized_topology(top_1, quantized_prototxt, caffe_bin_path, user_input_weights, user_input_iterations, + enable_floating_point, toleration, detection_flag, target_blob_name) print 'Updated prototxt {} is generated.'.format(quantized_prototxt) From 187c913200c41ffb12876d4001eae37d5548174d Mon Sep 17 00:00:00 2001 From: Shane Li Date: Thu, 11 Jan 2018 22:01:17 +0800 Subject: [PATCH 50/53] Add benchmarking descriptions into resnet_50 solver prototxt file --- models/intel_optimized_models/resnet_50/solver.prototxt | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/models/intel_optimized_models/resnet_50/solver.prototxt b/models/intel_optimized_models/resnet_50/solver.prototxt index bf9922187..5693483fd 100644 --- a/models/intel_optimized_models/resnet_50/solver.prototxt +++ b/models/intel_optimized_models/resnet_50/solver.prototxt @@ -1,3 +1,4 @@ +#The prototxt files(solver.prototxt and train_val.prototxt) are copied from "models/intel_optimized_models/multinode/resnet_50_16_nodes_2k_batch", temporarily used for throughput benchmarking. It can't achieve expected accuracy for training. We'll provide the files for single node training in the future. 
net: "models/intel_optimized_models/resnet_50/train_val.prototxt" test_iter: 1000 test_interval: 625 @@ -9,11 +10,9 @@ stepvalue:18750 stepvalue:37500 stepvalue:50000 gamma: 0.1 -max_iter: 56300 +max_iter: 200 warmup_iter: 3125 # 1281167 / 2048 * 5 epochs warmup_start_lr: 0.1 momentum: 0.9 weight_decay: 0.0001 -snapshot: 6250 -snapshot_prefix: "models/intel_optimized_models/resnet_50/resnet_50_" solver_mode: CPU From 17829ddfe09b8cb22a5e420cbf4c8857c0bd013f Mon Sep 17 00:00:00 2001 From: xiaolil1 Date: Fri, 12 Jan 2018 16:01:07 +0800 Subject: [PATCH 51/53] update models for int8 --- .../int8/inceptionv3_int8.prototxt | 290 ++++++++---------- .../int8/resnet50_int8.prototxt | 63 ++-- .../int8/resnet50_sparse_int8.prototxt | 67 ++-- .../int8/ssd_int8.prototxt | 27 +- 4 files changed, 172 insertions(+), 275 deletions(-) diff --git a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt index 70a52b698..40a810628 100644 --- a/models/intel_optimized_models/int8/inceptionv3_int8.prototxt +++ b/models/intel_optimized_models/int8/inceptionv3_int8.prototxt @@ -1,3 +1,4 @@ +# For INT8 reference name: "InceptionV3" layer { name: "data" @@ -90,7 +91,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 75.3399963379 - scale_out: 24.3700008392 + scale_out: 48.9399986267 scale_params: 125.419998169 } } @@ -134,7 +135,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 48.9399986267 - scale_out: 33.9199981689 + scale_out: 68.1200027466 scale_params: 238.300003052 } } @@ -190,7 +191,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 68.1200027466 - scale_out: 37.0099983215 + scale_out: 74.3199996948 scale_params: 115.459999084 } } @@ -234,7 +235,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 74.3199996948 - scale_out: 61.7999992371 + scale_out: 124.080001831 scale_params: 490.480010986 } } @@ -290,7 +291,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 124.080001831 - scale_out: 62.7400016785 + scale_out: 
125.970001221 scale_params: 239.179992676 } } @@ -334,7 +335,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 124.080001831 - scale_out: 79.2399978638 + scale_out: 159.11000061 scale_params: 303.589996338 } } @@ -378,7 +379,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 159.11000061 - scale_out: 69.2699966431 + scale_out: 139.080001831 scale_params: 495.859985352 } } @@ -422,7 +423,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 124.080001831 - scale_out: 72.8399963379 + scale_out: 146.25 scale_params: 215.38999939 } } @@ -466,7 +467,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 146.25 - scale_out: 85.2699966431 + scale_out: 171.210006714 scale_params: 322.309997559 } } @@ -510,7 +511,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 171.210006714 - scale_out: 57.8400001526 + scale_out: 116.150001526 scale_params: 303.209991455 } } @@ -566,7 +567,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 164.720001221 - scale_out: 87.5400009155 + scale_out: 175.770004272 scale_params: 160.130004883 } } @@ -621,8 +622,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 57.8400001526 - scale_out: 63.8800010681 + scale_in: 116.150001526 + scale_out: 128.270004272 scale_params: 229.300003052 } } @@ -665,8 +666,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 57.8400001526 - scale_out: 48.7599983215 + scale_in: 116.150001526 + scale_out: 97.9100036621 scale_params: 171.490005493 } } @@ -710,7 +711,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 97.9100036621 - scale_out: 54.2099990845 + scale_out: 108.839996338 scale_params: 516.630004883 } } @@ -753,8 +754,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 57.8400001526 - scale_out: 77.5999984741 + scale_in: 116.150001526 + scale_out: 155.809997559 scale_params: 194.460006714 } } @@ -798,7 +799,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 155.809997559 - scale_out: 100.75 + scale_out: 202.300003052 scale_params: 243.229995728 } } @@ -842,7 
+843,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 202.300003052 - scale_out: 52.8199996948 + scale_out: 106.050003052 scale_params: 90.2200012207 } } @@ -897,8 +898,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 80.2900009155 - scale_out: 100.050003052 + scale_in: 161.210006714 + scale_out: 200.88999939 scale_params: 146.809997559 } } @@ -953,8 +954,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 52.8199996948 - scale_out: 78.9400024414 + scale_in: 106.050003052 + scale_out: 158.509994507 scale_params: 251.970001221 } } @@ -997,8 +998,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 52.8199996948 - scale_out: 50.7700004578 + scale_in: 106.050003052 + scale_out: 101.940002441 scale_params: 211.789993286 } } @@ -1042,7 +1043,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 101.940002441 - scale_out: 62.0 + scale_out: 124.5 scale_params: 537.25 } } @@ -1085,8 +1086,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 52.8199996948 - scale_out: 80.1200027466 + scale_in: 106.050003052 + scale_out: 160.86000061 scale_params: 225.440002441 } } @@ -1130,7 +1131,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 160.86000061 - scale_out: 62.7799987793 + scale_out: 126.050003052 scale_params: 141.570007324 } } @@ -1174,7 +1175,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 126.050003052 - scale_out: 65.6800003052 + scale_out: 131.869995117 scale_params: 423.859985352 } } @@ -1229,8 +1230,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 85.0 - scale_out: 95.9300003052 + scale_in: 170.679992676 + scale_out: 192.61000061 scale_params: 127.099998474 } } @@ -1285,8 +1286,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 62.0 - scale_out: 76.8199996948 + scale_in: 124.5 + scale_out: 154.25 scale_params: 251.36000061 } } @@ -1329,8 +1330,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 62.0 - scale_out: 96.2900009155 + scale_in: 
124.5 + scale_out: 193.350006104 scale_params: 278.760009766 } } @@ -1374,7 +1375,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 193.350006104 - scale_out: 132.729995728 + scale_out: 266.5 scale_params: 457.459991455 } } @@ -1418,7 +1419,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 266.5 - scale_out: 58.7700004578 + scale_out: 118.0 scale_params: 270.910003662 } } @@ -1484,8 +1485,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 58.7700004578 - scale_out: 75.8399963379 + scale_in: 118.0 + scale_out: 152.289993286 scale_params: 153.630004883 } } @@ -1528,8 +1529,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 58.7700004578 - scale_out: 55.1300010681 + scale_in: 118.0 + scale_out: 110.699996948 scale_params: 182.440002441 } } @@ -1575,7 +1576,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 110.699996948 - scale_out: 48.0499992371 + scale_out: 96.4899978638 scale_params: 157.910003662 } } @@ -1621,7 +1622,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 96.4899978638 - scale_out: 62.3899993896 + scale_out: 125.279998779 scale_params: 241.160003662 } } @@ -1664,8 +1665,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 58.7700004578 - scale_out: 145.690002441 + scale_in: 118.0 + scale_out: 292.529998779 scale_params: 284.149993896 } } @@ -1711,7 +1712,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 292.529998779 - scale_out: 125.720001221 + scale_out: 252.419998169 scale_params: 290.660003662 } } @@ -1757,7 +1758,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 252.419998169 - scale_out: 69.25 + scale_out: 139.050003052 scale_params: 173.460006714 } } @@ -1803,7 +1804,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 139.050003052 - scale_out: 79.2600021362 + scale_out: 159.149993896 scale_params: 185.009994507 } } @@ -1849,7 +1850,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 159.149993896 - scale_out: 76.5999984741 + scale_out: 153.809997559 scale_params: 206.669998169 } } @@ 
-1904,8 +1905,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 100.790000916 - scale_out: 93.4000015259 + scale_in: 202.369995117 + scale_out: 187.529998779 scale_params: 116.709999084 } } @@ -1960,8 +1961,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 62.3899993896 - scale_out: 69.3000030518 + scale_in: 125.279998779 + scale_out: 139.149993896 scale_params: 192.5 } } @@ -2004,8 +2005,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 62.3899993896 - scale_out: 54.7299995422 + scale_in: 125.279998779 + scale_out: 109.88999939 scale_params: 252.080001831 } } @@ -2051,7 +2052,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 109.88999939 - scale_out: 54.1800003052 + scale_out: 108.779998779 scale_params: 196.350006104 } } @@ -2097,7 +2098,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 108.779998779 - scale_out: 47.1699981689 + scale_out: 94.7200012207 scale_params: 218.880004883 } } @@ -2140,8 +2141,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 62.3899993896 - scale_out: 107.379997253 + scale_in: 125.279998779 + scale_out: 215.61000061 scale_params: 294.489990234 } } @@ -2187,7 +2188,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 215.61000061 - scale_out: 72.3499984741 + scale_out: 145.259994507 scale_params: 186.509994507 } } @@ -2233,7 +2234,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 145.259994507 - scale_out: 62.2599983215 + scale_out: 125.019996643 scale_params: 243.020004272 } } @@ -2279,7 +2280,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 125.019996643 - scale_out: 82.0299987793 + scale_out: 164.699996948 scale_params: 320.420013428 } } @@ -2325,7 +2326,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 164.699996948 - scale_out: 78.0699996948 + scale_out: 156.759994507 scale_params: 216.5 } } @@ -2380,8 +2381,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 101.949996948 - scale_out: 64.6999969482 + scale_in: 204.699996948 + 
scale_out: 129.899993896 scale_params: 149.190002441 } } @@ -2436,8 +2437,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 47.1699981689 - scale_out: 67.3399963379 + scale_in: 94.7200012207 + scale_out: 135.210006714 scale_params: 165.38999939 } } @@ -2480,8 +2481,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 47.1699981689 - scale_out: 72.6299972534 + scale_in: 94.7200012207 + scale_out: 145.830001831 scale_params: 194.589996338 } } @@ -2527,7 +2528,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 145.830001831 - scale_out: 71.2099990845 + scale_out: 142.979995728 scale_params: 200.419998169 } } @@ -2573,7 +2574,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 142.979995728 - scale_out: 71.7600021362 + scale_out: 144.089996338 scale_params: 248.820007324 } } @@ -2616,8 +2617,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 47.1699981689 - scale_out: 89.7200012207 + scale_in: 94.7200012207 + scale_out: 180.13999939 scale_params: 276.739990234 } } @@ -2663,7 +2664,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 180.13999939 - scale_out: 51.8300018311 + scale_out: 104.069999695 scale_params: 231.600006104 } } @@ -2709,7 +2710,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 104.069999695 - scale_out: 58.4500007629 + scale_out: 117.370002747 scale_params: 192.809997559 } } @@ -2755,7 +2756,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 117.370002747 - scale_out: 54.4000015259 + scale_out: 109.230003357 scale_params: 210.199996948 } } @@ -2801,7 +2802,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 109.230003357 - scale_out: 86.8899993896 + scale_out: 174.460006714 scale_params: 312.559997559 } } @@ -2856,8 +2857,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 72.2799987793 - scale_out: 104.019996643 + scale_in: 145.119995117 + scale_out: 208.850006104 scale_params: 119.339996338 } } @@ -2912,8 +2913,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - 
scale_in: 67.3399963379 - scale_out: 67.4499969482 + scale_in: 135.210006714 + scale_out: 135.440002441 scale_params: 252.38999939 } } @@ -2956,8 +2957,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 67.3399963379 - scale_out: 64.8700027466 + scale_in: 135.210006714 + scale_out: 130.25 scale_params: 369.850006104 } } @@ -3003,7 +3004,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 130.25 - scale_out: 52.3899993896 + scale_out: 105.180000305 scale_params: 260.700012207 } } @@ -3049,7 +3050,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 105.180000305 - scale_out: 76.4199981689 + scale_out: 153.440002441 scale_params: 316.489990234 } } @@ -3092,8 +3093,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 67.3399963379 - scale_out: 80.0599975586 + scale_in: 135.210006714 + scale_out: 160.740005493 scale_params: 264.869995117 } } @@ -3139,7 +3140,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 160.740005493 - scale_out: 72.5599975586 + scale_out: 145.690002441 scale_params: 273.700012207 } } @@ -3185,7 +3186,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 145.690002441 - scale_out: 67.7699966431 + scale_out: 136.080001831 scale_params: 273.950012207 } } @@ -3231,7 +3232,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 136.080001831 - scale_out: 68.7900009155 + scale_out: 138.130004883 scale_params: 271.679992676 } } @@ -3277,7 +3278,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 138.130004883 - scale_out: 83.0400009155 + scale_out: 166.729995728 scale_params: 331.309997559 } } @@ -3332,8 +3333,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 116.220001221 - scale_out: 93.6600036621 + scale_in: 233.350006104 + scale_out: 188.050003052 scale_params: 129.759994507 } } @@ -3388,8 +3389,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 67.4499969482 - scale_out: 75.5800018311 + scale_in: 135.440002441 + scale_out: 151.75 scale_params: 245.309997559 } } @@ -3433,7 +3434,7 @@ 
layer { bw_layer_out: 8 bw_params: 8 scale_in: 151.75 - scale_out: 40.4199981689 + scale_out: 81.1500015259 scale_params: 171.190002441 } } @@ -3476,8 +3477,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 67.4499969482 - scale_out: 73.7399978638 + scale_in: 135.440002441 + scale_out: 148.070007324 scale_params: 135.559997559 } } @@ -3523,7 +3524,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 148.070007324 - scale_out: 57.2099990845 + scale_out: 114.86000061 scale_params: 123.540000916 } } @@ -3569,7 +3570,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 114.86000061 - scale_out: 96.2099990845 + scale_out: 193.179992676 scale_params: 310.769989014 } } @@ -3613,7 +3614,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 193.179992676 - scale_out: 67.4700012207 + scale_out: 135.479995728 scale_params: 313.369995117 } } @@ -3680,8 +3681,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 40.4199981689 - scale_out: 156.029998779 + scale_in: 81.1500015259 + scale_out: 313.279998779 scale_params: 400.739990234 } } @@ -3724,8 +3725,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 40.4199981689 - scale_out: 87.5299987793 + scale_in: 81.1500015259 + scale_out: 175.759994507 scale_params: 289.25 } } @@ -3771,7 +3772,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 175.759994507 - scale_out: 103.349998474 + scale_out: 207.509994507 scale_params: 346.429992676 } } @@ -3817,7 +3818,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 175.759994507 - scale_out: 93.3399963379 + scale_out: 187.419998169 scale_params: 263.369995117 } } @@ -3860,8 +3861,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 40.4199981689 - scale_out: 70.1999969482 + scale_in: 81.1500015259 + scale_out: 140.960006714 scale_params: 241.759994507 } } @@ -3905,7 +3906,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 140.960006714 - scale_out: 63.2599983215 + scale_out: 127.019996643 scale_params: 514.510009766 } } @@ 
-3951,7 +3952,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 127.019996643 - scale_out: 98.9100036621 + scale_out: 198.600006104 scale_params: 570.369995117 } } @@ -3997,7 +3998,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 127.019996643 - scale_out: 99.2799987793 + scale_out: 199.339996338 scale_params: 365.929992676 } } @@ -4052,8 +4053,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 75.75 - scale_out: 153.800003052 + scale_in: 152.100006104 + scale_out: 308.799987793 scale_params: 119.88999939 } } @@ -4111,8 +4112,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 93.3399963379 - scale_out: 16.8299999237 + scale_in: 187.419998169 + scale_out: 33.7900009155 scale_params: 19.4200000763 } } @@ -4155,8 +4156,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 93.3399963379 - scale_out: 61.1500015259 + scale_in: 187.419998169 + scale_out: 122.779998779 scale_params: 105.769996643 } } @@ -4202,7 +4203,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 122.779998779 - scale_out: 9.39999961853 + scale_out: 18.8600006104 scale_params: 35.6800003052 } } @@ -4248,7 +4249,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 122.779998779 - scale_out: 9.22000026703 + scale_out: 18.5200004578 scale_params: 37.3199996948 } } @@ -4291,8 +4292,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 93.3399963379 - scale_out: 60.1800003052 + scale_in: 187.419998169 + scale_out: 120.839996338 scale_params: 92.4100036621 } } @@ -4336,7 +4337,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 120.839996338 - scale_out: 94.8700027466 + scale_out: 190.479995728 scale_params: 345.420013428 } } @@ -4382,7 +4383,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 190.479995728 - scale_out: 8.35000038147 + scale_out: 16.7700004578 scale_params: 44.3199996948 } } @@ -4428,7 +4429,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 190.479995728 - scale_out: 10.9600000381 + scale_out: 22.0100002289 
scale_params: 44.2700004578 } } @@ -4483,8 +4484,8 @@ layer { bw_layer_in: 8 bw_layer_out: 8 bw_params: 8 - scale_in: 93.3399963379 - scale_out: 19.9799995422 + scale_in: 187.419998169 + scale_out: 40.1100006104 scale_params: 81.5699996948 } } @@ -4567,33 +4568,4 @@ layer { } } } -layer { - name: "loss" - type: "SoftmaxWithLoss" - bottom: "fc1" - bottom: "label" - top: "loss" -} -layer { - name: "acc/top-1" - type: "Accuracy" - bottom: "fc1" - bottom: "label" - top: "acc/top-1" - include { - phase: TEST - } -} -layer { - name: "acc/top-5" - type: "Accuracy" - bottom: "fc1" - bottom: "label" - top: "acc/top-5" - include { - phase: TEST - } - accuracy_param { - top_k: 5 - } -} + diff --git a/models/intel_optimized_models/int8/resnet50_int8.prototxt b/models/intel_optimized_models/int8/resnet50_int8.prototxt index c48020181..8d6aacd66 100644 --- a/models/intel_optimized_models/int8/resnet50_int8.prototxt +++ b/models/intel_optimized_models/int8/resnet50_int8.prototxt @@ -1,3 +1,4 @@ +# For INT8 reference name: "ResNet-50" layer { name: "data" @@ -6,10 +7,10 @@ layer { dummy_data_param { data_filler { type: "constant" - value: 0.0099999997764825821 + value: 0.01 } shape { - dim: 50 + dim: 64 dim: 3 dim: 224 dim: 224 @@ -25,7 +26,7 @@ layer { type: "constant" } shape { - dim: 50 + dim: 64 } } } @@ -263,7 +264,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 19.9799995422 - scale_out: 5.73999977112 + scale_out: 11.5200004578 scale_params: 72.1699981689 } } @@ -434,7 +435,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 19.5799999237 - scale_out: 5.73999977112 + scale_out: 11.5200004578 scale_params: 88.4599990845 } } @@ -605,7 +606,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 13.5799999237 - scale_out: 5.73999977112 + scale_out: 11.5200004578 scale_params: 103.910003662 } } @@ -822,7 +823,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 25.5400009155 - scale_out: 4.78000020981 + scale_out: 9.59000015259 scale_params: 65.7200012207 } } @@ -993,7 +994,7 @@ 
layer { bw_layer_out: 8 bw_params: 8 scale_in: 20.4899997711 - scale_out: 4.78000020981 + scale_out: 9.59000015259 scale_params: 55.6899986267 } } @@ -1164,7 +1165,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 3.74000000954 - scale_out: 4.78000020981 + scale_out: 9.59000015259 scale_params: 66.2300033569 } } @@ -1335,7 +1336,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 15.0600004196 - scale_out: 4.78000020981 + scale_out: 9.59000015259 scale_params: 113.980003357 } } @@ -1552,7 +1553,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 15.3699998856 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 75.6200027466 } } @@ -1723,7 +1724,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.44000005722 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 67.4400024414 } } @@ -1894,7 +1895,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.94999980927 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 76.9700012207 } } @@ -2065,7 +2066,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 5.40000009537 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 77.1500015259 } } @@ -2236,7 +2237,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.51999998093 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 98.8199996948 } } @@ -2407,7 +2408,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 5.01999998093 - scale_out: 3.70000004768 + scale_out: 7.42999982834 scale_params: 93.3000030518 } } @@ -2624,7 +2625,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 25.2000007629 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 27.1299991608 } } @@ -2795,7 +2796,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 29.2800006866 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 35.3400001526 } } @@ -2966,7 +2967,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 14.7100000381 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 
23.2399997711 } } @@ -3031,26 +3032,4 @@ layer { } } } -layer { - name: "accuracy/top-1" - type: "Accuracy" - bottom: "fc1000" - bottom: "label" - top: "accuracy-top1" - include { - phase: TEST - } -} -layer { - name: "accuracy/top-5" - type: "Accuracy" - bottom: "fc1000" - bottom: "label" - top: "accuracy-top5" - include { - phase: TEST - } - accuracy_param { - top_k: 5 - } -} + diff --git a/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt b/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt index 402b24a63..22eb796ff 100644 --- a/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt +++ b/models/intel_optimized_models/int8/resnet50_sparse_int8.prototxt @@ -1,3 +1,4 @@ +# For INT8 reference name: "ResNet-50" layer { name: "data" @@ -263,7 +264,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 19.9799995422 - scale_out: 6.03000020981 + scale_out: 12.1099996567 scale_params: 72.1699981689 } } @@ -434,7 +435,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 19.5799999237 - scale_out: 6.03000020981 + scale_out: 12.1099996567 scale_params: 88.4599990845 } } @@ -616,7 +617,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 16.9200000763 - scale_out: 5.73999977112 + scale_out: 11.5200004578 scale_params: 103.910003662 } } @@ -833,7 +834,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 25.5400009155 - scale_out: 4.65000009537 + scale_out: 9.32999992371 scale_params: 65.7200012207 } } @@ -1004,7 +1005,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 20.4899997711 - scale_out: 4.65000009537 + scale_out: 9.32999992371 scale_params: 55.6899986267 } } @@ -1175,7 +1176,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 3.70000004768 - scale_out: 4.65000009537 + scale_out: 9.32999992371 scale_params: 66.2300033569 } } @@ -1357,7 +1358,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 14.6999998093 - scale_out: 4.88999986649 + scale_out: 9.82999992371 scale_params: 113.980003357 } } @@ -1574,7 +1575,7 @@ layer { bw_layer_out: 
8 bw_params: 8 scale_in: 14.8900003433 - scale_out: 4.28000020981 + scale_out: 8.60000038147 scale_params: 75.6200027466 } } @@ -1745,7 +1746,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.30999994278 - scale_out: 4.28000020981 + scale_out: 8.60000038147 scale_params: 67.4400024414 } } @@ -1916,7 +1917,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.90999984741 - scale_out: 4.28000020981 + scale_out: 8.60000038147 scale_params: 76.9700012207 } } @@ -2087,7 +2088,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 5.40000009537 - scale_out: 4.28000020981 + scale_out: 8.60000038147 scale_params: 77.1500015259 } } @@ -2258,7 +2259,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 6.51999998093 - scale_out: 4.28000020981 + scale_out: 8.60000038147 scale_params: 98.8199996948 } } @@ -2440,7 +2441,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 16.6200008392 - scale_out: 4.23000001907 + scale_out: 8.5 scale_params: 93.3000030518 } } @@ -2657,7 +2658,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 25.2000007629 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 27.1299991608 } } @@ -2828,7 +2829,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 26.6200008392 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 35.3400001526 } } @@ -2999,7 +3000,7 @@ layer { bw_layer_out: 8 bw_params: 8 scale_in: 14.7100000381 - scale_out: 0.939999997616 + scale_out: 1.87999999523 scale_params: 23.2399997711 } } @@ -3064,36 +3065,4 @@ layer { } } } -layer { - name: "prob" - type: "SoftmaxWithLoss" - bottom: "fc1000" - bottom: "label" - top: "prob" - include { - phase: TRAIN - } -} -layer { - name: "accuracy/top-1" - type: "Accuracy" - bottom: "fc1000" - bottom: "label" - top: "accuracy-top1" - include { - phase: TEST - } -} -layer { - name: "accuracy/top-5" - type: "Accuracy" - bottom: "fc1000" - bottom: "label" - top: "accuracy-top5" - include { - phase: TEST - } - accuracy_param { - top_k: 5 - } -} + diff --git 
a/models/intel_optimized_models/int8/ssd_int8.prototxt b/models/intel_optimized_models/int8/ssd_int8.prototxt index 26e1a28dc..4a0ed0332 100644 --- a/models/intel_optimized_models/int8/ssd_int8.prototxt +++ b/models/intel_optimized_models/int8/ssd_int8.prototxt @@ -1,3 +1,4 @@ +# For INT8 reference name: "VGG_VOC0712_SSD_300x300_test" layer { name: "data" @@ -1946,33 +1947,9 @@ layer { nms_threshold: 0.449999988079 top_k: 400 } - save_output_param { - output_directory: "data/ssd_out/VOC2007/SSD_300x300" - output_name_prefix: "comp4_det_test_" - output_format: "VOC" - label_map_file: "data/VOC0712/labelmap_voc.prototxt" - name_size_file: "data/VOC0712/test_name_size.txt" - num_test_image: 4952 - } code_type: CENTER_SIZE keep_top_k: 200 confidence_threshold: 0.00999999977648 } } -layer { - name: "detection_eval" - type: "DetectionEvaluate" - bottom: "detection_out" - bottom: "label" - top: "detection_eval" - include { - phase: TEST - } - detection_evaluate_param { - num_classes: 21 - background_label_id: 0 - overlap_threshold: 0.5 - evaluate_difficult_gt: false - name_size_file: "data/VOC0712/test_name_size.txt" - } -} + From c29e6fae40ff7c3ec56a70f4a10f718e01c5110e Mon Sep 17 00:00:00 2001 From: Shane Li Date: Fri, 12 Jan 2018 16:46:33 +0800 Subject: [PATCH 52/53] Fix batch size change issue --- scripts/run_benchmark.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/run_benchmark.py b/scripts/run_benchmark.py index 7f67764e0..93d68ba4d 100755 --- a/scripts/run_benchmark.py +++ b/scripts/run_benchmark.py @@ -108,7 +108,7 @@ def obtain_model_file(self, model): for line in src_f.readlines(): if re.match(batch_size_pattern, line) and cnt < batch_size_cnt: #change batch size - re.sub("[0-9]+", new_batch_size, line, count = 1) + line = re.sub("[0-9]+", new_batch_size, line, count = 1) cnt += 1 dst_f.write(line) return dst_model_file From 4bb950c12b8852f3c190622e79e2ed824686e55c Mon Sep 17 00:00:00 2001 From: Shane Li Date: Fri, 12 Jan 2018 
21:42:00 +0800 Subject: [PATCH 53/53] Correct batch size pattern used on lmdb dataset benchmarking and make the error log more clear --- scripts/run_benchmark.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/scripts/run_benchmark.py b/scripts/run_benchmark.py index 93d68ba4d..3da1f5434 100755 --- a/scripts/run_benchmark.py +++ b/scripts/run_benchmark.py @@ -97,7 +97,7 @@ def obtain_model_file(self, model): src_model_file = "/".join([self.model_path, model, prototxt_file]) if not os.path.isfile(src_model_file): logging.exception("template model file {} doesn't exist.".format(src_model_file)) - batch_size_pattern = re.compile(".*shape:.*") if self.dummy_data_use else re.compile(".*batch size:.*") + batch_size_pattern = re.compile(".*shape:.*") if self.dummy_data_use else re.compile("^\s+batch_size:.*") # we only care about train phase batch size for benchmarking batch_size_cnt = 2 if self.dummy_data_use else 1 if model not in self.bkm_batch_size or self.cpu_model not in self.bkm_batch_size[model]: @@ -200,7 +200,7 @@ def obtain_average_fwd_bwd_time(self): if re.match(average_fwd_bwd_time_pattern, line): average_time = line.split()[-2] if average_time == "": - logging.exception("Error: running intelcaffe failed, please check logs under: {}".format(result_file)) + logging.exception("Error: can't find average forward-backward time within logs, please check logs under: {}".format(result_file)) average_time = float(average_time) else: start_iteration = 100 @@ -228,7 +228,7 @@ def obtain_batch_size(self): with open(log_file, 'r') as f: batch_size_pattern_time = re.compile(".*SetMinibatchSize.*") batch_size_pattern_dummy = re.compile(".*dim:.*") - batch_size_pattern_real = re.compile(".*batch_size:.*") + batch_size_pattern_real = re.compile("^\s+batch_size:.*") batch_size = '' for line in f.readlines(): if re.match(batch_size_pattern_time, line) or re.match(batch_size_pattern_real, line) or re.match(batch_size_pattern_dummy, line):