intel
diff --git a/‎Makefile.config.example‎
Lines changed: 3 additions & 0 deletions b/‎Makefile.config.example‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎cmake/Misc.cmake‎
Lines changed: 5 additions & 0 deletions b/‎cmake/Misc.cmake‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎examples/faster-rcnn/lib/fast_rcnn/net_sample_utils.py‎
Lines changed: 69 additions & 0 deletions b/‎examples/faster-rcnn/lib/fast_rcnn/net_sample_utils.py‎
Lines changed: 69 additions & 0 deletions
diff --git a/‎examples/faster-rcnn/lib/fast_rcnn/test.py‎
Lines changed: 45 additions & 3 deletions b/‎examples/faster-rcnn/lib/fast_rcnn/test.py‎
Lines changed: 45 additions & 3 deletions
diff --git a/‎examples/faster-rcnn/tools/test_net.py‎
Lines changed: 42 additions & 2 deletions b/‎examples/faster-rcnn/tools/test_net.py‎
Lines changed: 42 additions & 2 deletions
diff --git a/‎examples/rfcn/lib/fast_rcnn/net_sample_utils.py‎
Lines changed: 69 additions & 0 deletions b/‎examples/rfcn/lib/fast_rcnn/net_sample_utils.py‎
Lines changed: 69 additions & 0 deletions
diff --git a/‎examples/rfcn/lib/fast_rcnn/test.py‎
Lines changed: 40 additions & 2 deletions b/‎examples/rfcn/lib/fast_rcnn/test.py‎
Lines changed: 40 additions & 2 deletions
@@ -87,6 +87,9 @@ DISABLE_CONV_RELU_FUSION:= 0
 # Use Bn + ReLU fusion to boost inference
 DISABLE_BN_RELU_FUSION := 0
 
+# Use Conv + Concat fusion to boost inference.
+ENABLE_CONCAT_FUSION := 0
+
 # Use Conv + Eltwise + Relu layer fusion to boost inference.
 DISABLE_CONV_SUM_FUSION := 0
 
 
@@ -21,6 +21,11 @@ if(DISABLE_BN_RELU_FUSION)
     add_definitions("-DDISABLE_BN_RELU_FUSION")
 endif()
 
+if(ENABLE_CONCAT_FUSION)
+	message(STATUS "conv/concat fusion is enabled!")
+	add_definitions("-DENABLE_CONCAT_FUSION")
+endif()
+
 if(DISABLE_CONV_SUM_FUSION)
 	message(STATUS "conv/eltwise/relu fusion is disabled!")
 	add_definitions("-DDISABLE_CONV_SUM_FUSION")
 
@@ -0,0 +1,69 @@
+# 
+# All modification made by Intel Corporation: Copyright (c) 2016 Intel Corporation
+# 
+# All contributions by the University of California:
+# Copyright (c) 2014, 2015, The Regents of the University of California (Regents)
+# All rights reserved.
+# 
+# All other contributions:
+# Copyright (c) 2014, 2015, the respective contributors
+# All rights reserved.
+# For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md
+# 
+# 
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 
+#     * Redistributions of source code must retain the above copyright notice,
+#       this list of conditions and the following disclaimer.
+#     * Redistributions in binary form must reproduce the above copyright
+#       notice, this list of conditions and the following disclaimer in the
+#       documentation and/or other materials provided with the distribution.
+#     * Neither the name of Intel Corporation nor the names of its contributors
+#       may be used to endorse or promote products derived from this software
+#       without specific prior written permission.
+# 
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
+# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+#
+import caffe
+import google.protobuf.text_format as txtf
+from caffe.proto import caffe_pb2
+
+def update_conv_quantized_dict(conv_quantized_dict, tmp_conv_quantized_dict):  # Merge tmp_conv_quantized_dict into conv_quantized_dict in place, keeping the larger value per slot; returns None.
+    for conv in conv_quantized_dict:  # only keys of the target dict are visited; each must also be present in the tmp dict for the lookups below
+        if tmp_conv_quantized_dict[conv][0] > conv_quantized_dict[conv][0]:  # slot 0: keep the running maximum (create_quantized_net writes slot 0 to scale_in)
+            conv_quantized_dict[conv][0] = tmp_conv_quantized_dict[conv][0]
+
+        if tmp_conv_quantized_dict[conv][1] > conv_quantized_dict[conv][1]:  # slot 1: same rule (create_quantized_net writes slot 1 to scale_out); slot 2 is never touched here
+            conv_quantized_dict[conv][1] = tmp_conv_quantized_dict[conv][1]
+
+
+def create_quantized_net(raw_net, quantized_net, conv_quantized_dict):  # Read the prototxt at path raw_net, attach 8-bit quantization parameters to its Convolution layers, and write the result to path quantized_net.
+    net_param = caffe_pb2.NetParameter()
+    with open(raw_net) as f:
+        txtf.Merge(f.read(), net_param)  # parse the text-format file contents into net_param
+    # Skip the first Convolution layer when quantizing the net; only later ones get quantization parameters.
+    first_conv = True
+    for layer_param in net_param.layer:
+        if layer_param.type == "Convolution":  # every other layer type is left unchanged
+            if first_conv:
+                first_conv = False
+                continue
+            layer_param.quantization_param.bw_layer_in = 8  # the three bw_* fields are hard-coded to 8
+            layer_param.quantization_param.bw_layer_out = 8
+            layer_param.quantization_param.bw_params = 8
+            layer_param.quantization_param.scale_in.append(conv_quantized_dict[layer_param.name][0])  # dict is keyed by layer name; a quantized conv layer missing from it fails this lookup
+            layer_param.quantization_param.scale_out.append(conv_quantized_dict[layer_param.name][1])
+            for param_scale in conv_quantized_dict[layer_param.name][2]:  # slot 2 is iterable: one scale_params entry is appended per element
+                layer_param.quantization_param.scale_params.append(param_scale)
+    with open(quantized_net, 'w') as f:
+        f.write(str(net_param))  # str() of the message is what gets written; nothing is returned
@@ -10,14 +10,20 @@
 from fast_rcnn.config import cfg, get_output_dir
 from fast_rcnn.bbox_transform import clip_boxes, bbox_transform_inv
 import argparse
+from fast_rcnn import net_sample_utils
 from utils.timer import Timer
 import numpy as np
 import cv2
 import caffe
+import os
+import sys
+utilpath = os.path.split(os.path.realpath(__file__))[0] + "/../../../../scripts/"
+print utilpath
+sys.path.insert(0, utilpath)
+import sampling
 from fast_rcnn.nms_wrapper import nms
 import cPickle
 from utils.blob import im_list_to_blob
-import os
 
 def _get_image_blob(im):
     """Converts an image into a network input.
@@ -105,7 +111,7 @@ def _get_blobs(im, rois):
         blobs['rois'] = _get_rois_blob(rois, im_scale_factors)
     return blobs, im_scale_factors
 
-def im_detect(net, im, boxes=None):
+def im_detect(net, im, boxes=None, sample_blobs = None):
     """Detect object classes in an image given object proposals.
 
     Arguments:
@@ -152,7 +158,19 @@ def im_detect(net, im, boxes=None):
     else:
         forward_kwargs['rois'] = blobs['rois'].astype(np.float32, copy=False)
     blobs_out = net.forward(**forward_kwargs)
-
+    
+    
+
+    if sample_blobs != None:
+        for k, _ in net.blobs.items(): # top blob
+            output = np.array(net.blobs[k].data)
+            if k not in sample_blobs.keys():
+                sample_blobs[k] = [output]
+            else:
+                new_outputs = sample_blobs[k]
+                #print "new_outputs type: " + str(type(new_outputs))
+                new_outputs.append(output)
+                sample_blobs[k] = new_outputs
     if cfg.TEST.HAS_RPN:
         assert len(im_scales) == 1, "Only single-image batch implemented"
         rois = net.blobs['rois'].data.copy()
@@ -224,6 +242,30 @@ def apply_nms(all_boxes, thresh):
             nms_boxes[cls_ind][im_ind] = dets[keep, :].copy()
     return nms_boxes
 
+
+def sample_net(raw_net_prototxt, net, imdb, sampling_iterations, quant_mode, enable_first_conv = False, winograd_algo = False):  # Run im_detect on sampling_iterations images while collecting blob data, gather absolute conv weights, and return them with the blob/layer maps and winograd info. NOTE(review): quant_mode is not used in this body.
+
+    (conv_layers, test_net_top_names, test_net_bottom_names, conv_top_blob_layer_map, conv_bottom_blob_layer_map) = sampling.get_blob_map(net, enable_first_conv)
+    # Currently our sample_net only supports TEST with the HAS_RPN and AGNOSTIC flags.
+    num_images = len(imdb.image_index)  # NOTE(review): computed but never read below
+    image_index = 0
+    box_proposals = None  # always passed as None, i.e. no precomputed proposals are supplied to im_detect
+    sample_blobs = {}  # filled in place by im_detect, which appends each blob's data under the blob name
+    for iter_ in xrange(sampling_iterations):  # one image per iteration, taken in imdb order starting at index 0; loop body is tab-indented in the original
+	im = cv2.imread(imdb.image_path_at(image_index))
+	im_detect(net, im, box_proposals, sample_blobs)  # return value is discarded; only the sample_blobs side effect is used
+	image_index += 1  # NOTE(review): not bounded by num_images -- presumably fails if sampling_iterations exceeds the image count; confirm
+
+    params = {}
+    for k, _ in net.params.items():
+        if k not in conv_layers:  # keep only the layers reported by sampling.get_blob_map
+            continue
+        param = np.abs(net.params[k][0].data) # ignore bias: only entry 0 of the layer's params is taken, as absolute values
+        params[k] = [param]  # wrapped in a one-element list
+
+    (winograd_bottoms, winograd_convolutions) = sampling.get_winograd_info(raw_net_prototxt, conv_bottom_blob_layer_map, winograd_algo)
+    return (sample_blobs, params, test_net_top_names, test_net_bottom_names, conv_top_blob_layer_map, conv_bottom_blob_layer_map, winograd_bottoms, winograd_convolutions)  # 8-tuple; conv_layers itself is not returned
+
 def test_net(net, imdb, max_per_image=100, thresh=0.05, vis=False):
     """Test a Fast R-CNN network on an image database."""
     num_images = len(imdb.image_index)
 
@@ -11,12 +11,19 @@
 
 import _init_paths
 from fast_rcnn.test import test_net
+from fast_rcnn.test import sample_net
+from fast_rcnn import net_sample_utils
 from fast_rcnn.config import cfg, cfg_from_file, cfg_from_list
 from datasets.factory import get_imdb
 import caffe
+
+import time, os, sys
+utilpath = os.path.split(os.path.realpath(__file__))[0] + "/../../../scripts/"
+sys.path.insert(0, utilpath)
+import calibrator
+import sampling
 import argparse
 import pprint
-import time, os, sys
 
 def parse_args():
     """
@@ -49,7 +56,27 @@ def parse_args():
     parser.add_argument('--num_dets', dest='max_per_image',
                         help='max number of detections per image',
                         default=100, type=int)
+    parser.add_argument('--quantized_net', action='store', dest='quantized_prototxt',
+			default=None, type=str)
+    parser.add_argument('--sample_iters', action='store', dest='sample_iters',
+                        default=100, type=int)
+    parser.add_argument('--quant_mode', action='store', dest='quant_mode',
+			default='single', type=str)
+
+    parser.add_argument('-u', '--unsigned_range', dest='unsigned_range', action="store_true", default=False,
+                        help='to quantize using unsigned range for activation')
 
+    parser.add_argument('-t', '--concat_use_fp32', dest='concat_use_fp32', action="store_true", default=False,
+                        help='to use fp32 for concat')
+
+    parser.add_argument('-f', '--unify_concat_scales', dest='unify_concat_scales', action="store_true", default=False,
+                        help='to unify concat scales')
+
+    parser.add_argument('-a', '--calibration_algos', dest='calibration_algos', action='store', default="DIRECT",
+                        help='to choose the calibration alogorithm')
+
+    parser.add_argument('-wi', '--conv_algo', dest='conv_algo', action="store_true", default=False,
+                        help='to choose the convolution algorithm')
     if len(sys.argv) == 1:
         parser.print_help()
         sys.exit(1)
@@ -87,4 +114,17 @@ def parse_args():
     if not cfg.TEST.HAS_RPN:
         imdb.set_proposal_method(cfg.TEST.PROPOSAL_METHOD)
 
-    test_net(net, imdb, max_per_image=args.max_per_image, vis=args.vis)
+    if args.quantized_prototxt == None:
+	test_net(net, imdb, max_per_image=args.max_per_image, vis=args.vis)
+    else:
+        (blobs, params, top_blobs_map, bottom_blobs_map, conv_top_blob_layer_map, conv_bottom_blob_layer_map, winograd_bottoms, winograd_convolutions) = sample_net(args.prototxt, net, imdb, args.sample_iters, args.quant_mode)
+
+        (inputs_max, outputs_max, inputs_min) = sampling.calibrate_activations(blobs, conv_top_blob_layer_map, conv_bottom_blob_layer_map, winograd_bottoms, args.calibration_algos, "SINGLE", args.conv_algo)
+        params_max = sampling.calibrate_parameters(params, winograd_convolutions, "DIRECT", args.quant_mode.upper(), args.conv_algo)
+        calibrator.generate_sample_impl(args.prototxt, args.quantized_prototxt, inputs_max, outputs_max, inputs_min, params_max, False)
+        compiled_net_str = caffe.compile_net(args.prototxt, caffe.TEST, "MKLDNN")
+        raw_net_basename = os.path.basename(args.prototxt)
+        compile_net_path = "./compiled_" + raw_net_basename
+        with open(compile_net_path, "w") as f:
+            f.write(compiled_net_str)
+        calibrator.transform_convolutions(args.quantized_prototxt, compile_net_path, top_blobs_map, bottom_blobs_map, args.unsigned_range, args.concat_use_fp32, args.unify_concat_scales, args.conv_algo, False)
@@ -0,0 +1,69 @@
+# 
+# All modification made by Intel Corporation: Copyright (c) 2016 Intel Corporation
+# 
+# All contributions by the University of California:
+# Copyright (c) 2014, 2015, The Regents of the University of California (Regents)
+# All rights reserved.
+# 
+# All other contributions:
+# Copyright (c) 2014, 2015, the respective contributors
+# All rights reserved.
+# For the list of contributors go to https://github.com/BVLC/caffe/blob/master/CONTRIBUTORS.md
+# 
+# 
+# Redistribution and use in source and binary forms, with or without
+# modification, are permitted provided that the following conditions are met:
+# 
+#     * Redistributions of source code must retain the above copyright notice,
+#       this list of conditions and the following disclaimer.
+#     * Redistributions in binary form must reproduce the above copyright
+#       notice, this list of conditions and the following disclaimer in the
+#       documentation and/or other materials provided with the distribution.
+#     * Neither the name of Intel Corporation nor the names of its contributors
+#       may be used to endorse or promote products derived from this software
+#       without specific prior written permission.
+# 
+# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
+# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+# DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
+# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
+# SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
+# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+# OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+#
+import caffe
+import google.protobuf.text_format as txtf
+from caffe.proto import caffe_pb2
+
+def update_conv_quantized_dict(conv_quantized_dict, tmp_conv_quantized_dict):  # Merge tmp_conv_quantized_dict into conv_quantized_dict in place, keeping the larger value per slot; returns None.
+    for conv in conv_quantized_dict:  # only keys of the target dict are visited; each must also be present in the tmp dict for the lookups below
+        if tmp_conv_quantized_dict[conv][0] > conv_quantized_dict[conv][0]:  # slot 0: keep the running maximum (create_quantized_net writes slot 0 to scale_in)
+            conv_quantized_dict[conv][0] = tmp_conv_quantized_dict[conv][0]
+
+        if tmp_conv_quantized_dict[conv][1] > conv_quantized_dict[conv][1]:  # slot 1: same rule (create_quantized_net writes slot 1 to scale_out); slot 2 is never touched here
+            conv_quantized_dict[conv][1] = tmp_conv_quantized_dict[conv][1]
+
+
+def create_quantized_net(raw_net, quantized_net, conv_quantized_dict):  # Read the prototxt at path raw_net, attach 8-bit quantization parameters to its Convolution layers, and write the result to path quantized_net.
+    net_param = caffe_pb2.NetParameter()
+    with open(raw_net) as f:
+        txtf.Merge(f.read(), net_param)  # parse the text-format file contents into net_param
+    # Skip the first Convolution layer when quantizing the net; only later ones get quantization parameters.
+    first_conv = True
+    for layer_param in net_param.layer:
+        if layer_param.type == "Convolution":  # every other layer type is left unchanged
+            if first_conv:
+                first_conv = False
+                continue
+            layer_param.quantization_param.bw_layer_in = 8  # the three bw_* fields are hard-coded to 8
+            layer_param.quantization_param.bw_layer_out = 8
+            layer_param.quantization_param.bw_params = 8
+            layer_param.quantization_param.scale_in.append(conv_quantized_dict[layer_param.name][0])  # dict is keyed by layer name; a quantized conv layer missing from it fails this lookup
+            layer_param.quantization_param.scale_out.append(conv_quantized_dict[layer_param.name][1])
+            for param_scale in conv_quantized_dict[layer_param.name][2]:  # slot 2 is iterable: one scale_params entry is appended per element
+                layer_param.quantization_param.scale_params.append(param_scale)
+    with open(quantized_net, 'w') as f:
+        f.write(str(net_param))  # str() of the message is what gets written; nothing is returned
@@ -10,15 +10,21 @@
 from fast_rcnn.config import cfg, get_output_dir
 from fast_rcnn.bbox_transform import clip_boxes, bbox_transform_inv
 import argparse
+from fast_rcnn import net_sample_utils
 from utils.timer import Timer
 import numpy as np
 import cv2
 import caffe
+import os
+import sys
+utilpath = os.path.split(os.path.realpath(__file__))[0] + "/../../../../scripts/"
+print utilpath
+sys.path.insert(0, utilpath)
+import sampling
 from fast_rcnn.nms_wrapper import nms
 import cPickle
 import gzip
 from utils.blob import im_list_to_blob
-import os
 
 def _get_image_blob(im):
     """Converts an image into a network input.
@@ -106,7 +112,7 @@ def _get_blobs(im, rois):
         blobs['rois'] = _get_rois_blob(rois, im_scale_factors)
     return blobs, im_scale_factors
 
-def im_detect(net, im, boxes=None):
+def im_detect(net, im, boxes=None, sample_blobs = None):
     """Detect object classes in an image given object proposals.
 
     Arguments:
@@ -154,6 +160,16 @@ def im_detect(net, im, boxes=None):
         forward_kwargs['rois'] = blobs['rois'].astype(np.float32, copy=False)
     blobs_out = net.forward(**forward_kwargs)
 
+    if sample_blobs != None:
+        for k, _ in net.blobs.items(): # top blob
+            output = np.array(net.blobs[k].data)
+            if k not in sample_blobs.keys():
+                sample_blobs[k] = [output]
+            else:
+                new_outputs = sample_blobs[k]
+                #print "new_outputs type: " + str(type(new_outputs))
+                new_outputs.append(output)
+                sample_blobs[k] = new_outputs
     if cfg.TEST.HAS_RPN:
         assert len(im_scales) == 1, "Only single-image batch implemented"
         rois = net.blobs['rois'].data.copy()
@@ -225,6 +241,28 @@ def apply_nms(all_boxes, thresh):
             nms_boxes[cls_ind][im_ind] = dets[keep, :].copy()
     return nms_boxes
 
+def sample_net(raw_net_prototxt, net, imdb, sampling_iterations, quant_mode, enable_first_conv = False, winograd_algo = False):  # Run im_detect on sampling_iterations images while collecting blob data, gather absolute conv weights, and return them with the blob/layer maps and winograd info. NOTE(review): quant_mode is not used in this body.
+
+    (conv_layers, test_net_top_names, test_net_bottom_names, conv_top_blob_layer_map, conv_bottom_blob_layer_map) = sampling.get_blob_map(net, enable_first_conv)
+    # Currently our sample_net only supports TEST with the HAS_RPN and AGNOSTIC flags.
+    num_images = len(imdb.image_index)  # NOTE(review): computed but never read below
+    image_index = 0
+    box_proposals = None  # always passed as None, i.e. no precomputed proposals are supplied to im_detect
+    sample_blobs = {}  # filled in place by im_detect, which appends each blob's data under the blob name
+    for iter_ in xrange(sampling_iterations):  # one image per iteration, taken in imdb order starting at index 0; loop body is tab-indented in the original
+	im = cv2.imread(imdb.image_path_at(image_index))
+	im_detect(net, im, box_proposals, sample_blobs)  # return value is discarded; only the sample_blobs side effect is used
+	image_index += 1  # NOTE(review): not bounded by num_images -- presumably fails if sampling_iterations exceeds the image count; confirm
+
+    params = {}
+    for k, _ in net.params.items():
+        if k not in conv_layers:  # keep only the layers reported by sampling.get_blob_map
+            continue
+        param = np.abs(net.params[k][0].data) # ignore bias: only entry 0 of the layer's params is taken, as absolute values
+        params[k] = [param]  # wrapped in a one-element list
+
+    (winograd_bottoms, winograd_convolutions) = sampling.get_winograd_info(raw_net_prototxt, conv_bottom_blob_layer_map, winograd_algo)
+    return (sample_blobs, params, test_net_top_names, test_net_bottom_names, conv_top_blob_layer_map, conv_bottom_blob_layer_map, winograd_bottoms, winograd_convolutions)  # 8-tuple; conv_layers itself is not returned
 def test_net(net, imdb, max_per_image=400, thresh=-np.inf, vis=False):
     """Test a Fast R-CNN network on an image database."""
     num_images = len(imdb.image_index)