RachelXu7
diff --git a/‎deploy/cpp/README.md
+2-2 b/‎deploy/cpp/README.md
+2-2
diff --git a/‎deploy/python/README.md
+1-46 b/‎deploy/python/README.md
+1-46
diff --git a/‎deploy/python/infer.py
+3-1 b/‎deploy/python/infer.py
+3-1
diff --git a/‎deploy/python/infer_benchmark.py
+207 b/‎deploy/python/infer_benchmark.py
+207
diff --git a/‎docs/slim/quant/quant.md
+10-12 b/‎docs/slim/quant/quant.md
+10-12
diff --git a/‎paddleseg/models/backbones/hrnet.py
+10-4 b/‎paddleseg/models/backbones/hrnet.py
+10-4
@@ -1,8 +1,8 @@
 # PaddleSeg C++ 预测部署方案
 
-## 使用Paddle Inference部署PaddleSeg模型
+## 使用Paddle Inference C++部署PaddleSeg模型
 
-使用Paddle Inference部署PaddleSeg模型，请参考[教程](../../docs/deployment/inference/cpp_inference.md)。
+使用Paddle Inference C++部署PaddleSeg模型，请参考[教程](../../docs/deployment/inference/cpp_inference.md)。
 
 ## 使用PaddleX部署PaddleSeg模型
 
 
@@ -1,46 +1 @@
-# PaddleSeg Python 预测部署方案
-
-## 1. 说明
-
-本文档介绍使用飞桨推理的Python接口在服务器端部署分割模型。大家通过一定的配置，加上少量的代码，即可把模型集成到自己的服务中，完成图像分割的任务。
-
-飞桨推理的[官网文档](https://paddleinference.paddlepaddle.org.cn/product_introduction/summary.html)介绍了部署模型的步骤、多种API接口、示例等等，大家可以根据实际需求进行使用。
-
-## 2. 前置准备
-
-请使用[模型导出工具](../../docs/model_export.md)导出您的模型, 或点击下载我们的[样例模型](https://paddleseg.bj.bcebos.com/dygraph/demo/bisenet_demo_model.tar.gz)用于测试。
-
-接着准备一张测试图片用于试验效果，我们提供了cityscapes验证集中的一张[图片](https://paddleseg.bj.bcebos.com/dygraph/demo/cityscapes_demo.png)用于演示效果，如果您的模型是使用其他数据集训练的，请自行准备测试图片。
-
-## 3. 预测
-
-在终端输入以下命令进行预测:
-```shell
-python deploy/python/infer.py --config /path/to/deploy.yaml --image_path /path/to/image/path/or/dir
-```
-
-参数说明如下:
-|参数名|用途|是否必选项|默认值|
-|-|-|-|-|
-|config|**导出模型时生成的配置文件**, 而非configs目录下的配置文件|是|-|
-|image_path|预测图片的路径或者目录或者文件列表|是|-|
-|batch_size|单卡batch size|否|1|
-|save_dir|保存预测结果的目录|否|output|
-|device|预测执行设备，可选项有'cpu','gpu'|否|'gpu'|
-|use_trt|是否开启TensorRT来加速预测|否|False|
-|precision|启动TensorRT预测时的数值精度，可选项有'fp32','fp16','int8'|否|'fp32'|
-|cpu_threads|使用cpu预测的线程数|否|10|
-|enable_mkldnn|是否使用MKL-DNN加速cpu预测|否|False|
-|benchmark|是否产出日志，包含环境、模型、配置、性能信息|否|False|
-|with_argmax|对预测结果进行argmax操作|否|否|
-
-*测试样例和预测结果如下*
-![cityscape_predict_demo.png](../../docs/images/cityscapes_predict_demo.png)
-
-**注意**
-
-1. 当使用量化模型预测时，需要同时开启TensorRT预测和int8预测才会有加速效果
-
-2. 使用TensorRT需要使用支持TRT功能的Paddle库，请参考[附录](https://www.paddlepaddle.org.cn/documentation/docs/zh/install/Tables.html#whl-release)下载对应的PaddlePaddle安装包，或者参考[源码编译](https://www.paddlepaddle.org.cn/documentation/docs/zh/install/compile/fromsource.html)自行编译
-
-3. 要开启`--benchmark`的话需要安装auto_log。[安装方式](https://github.com/LDOUBLEV/AutoLog)
+使用Paddle Inference Python部署PaddleSeg模型，请参考[教程](../../docs/deployment/inference/python_inference.md)。
@@ -75,6 +75,7 @@ def __init__(self, args):
         if args.device == 'gpu':
             # set GPU configs accordingly
             # such as intialize the gpu memory, enable tensorrt
+            logger.info("Use GPU")
             pred_cfg.enable_use_gpu(100, 0)
             pred_cfg.switch_ir_optim(True)
             precision_map = {
@@ -100,6 +101,7 @@ def __init__(self, args):
         else:
             # set CPU configs accordingly,
             # such as enable_mkldnn, set_cpu_math_library_num_threads
+            logger.info("Use CPU")
             pred_cfg.disable_gpu()
             if args.enable_mkldnn:
                 # cache 10 different shapes for mkldnn to avoid memory leak
@@ -109,7 +111,7 @@ def __init__(self, args):
 
         self.predictor = create_predictor(pred_cfg)
 
-        if args.benchmark:
+        if hasattr(self.args, 'benchmark') and self.args.benchmark:
             import auto_log
             pid = os.getpid()
             self.autolog = auto_log.AutoLogger(
 
@@ -0,0 +1,207 @@
+# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import argparse
+import codecs
+import os
+import sys
+
+import time
+import yaml
+import numpy as np
+import paddle
+
+LOCAL_PATH = os.path.dirname(os.path.abspath(__file__))
+sys.path.append(os.path.join(LOCAL_PATH, '..', '..'))
+
+from paddleseg.cvlibs import manager
+from paddleseg.utils import logger, metrics, progbar
+
+from infer import Predictor
+
+
+def parse_args():
+    """
+    Build the command-line parser for this script and parse the arguments.
+
+    ``--config``, ``--dataset_type`` and ``--dataset_path`` are declared with
+    ``required=True``, so their ``default=None`` is never used. The value of
+    ``--config`` is stored under the attribute name ``cfg`` (see ``dest``).
+
+    Returns:
+        argparse.Namespace: The parsed command-line options.
+    """
+    parser = argparse.ArgumentParser(description='Model Infer')
+    parser.add_argument(
+        "--config",
+        dest="cfg",
+        help="The config file.",
+        default=None,
+        type=str,
+        required=True)
+
+    parser.add_argument(
+        '--dataset_type',
+        dest='dataset_type',
+        help='The name of dataset, such as Cityscapes, PascalVOC and ADE20K.',
+        type=str,
+        default=None,
+        required=True)
+    parser.add_argument(
+        '--dataset_path',
+        dest='dataset_path',
+        help='The directory of the dataset to be predicted. If set dataset_path, '
+        'it use the test and label images to calculate the mIoU.',
+        type=str,
+        default=None,
+        required=True)
+    parser.add_argument(
+        '--dataset_mode',
+        dest='dataset_mode',
+        help='The dataset mode, such as train, val.',
+        type=str,
+        default="val")
+    # NOTE(review): test_dataset() in this file builds every input as
+    # np.array([img]); whether Predictor consumes batch_size cannot be told
+    # from this file -- TODO confirm.
+    parser.add_argument(
+        '--batch_size',
+        dest='batch_size',
+        help='Mini batch size of one gpu or cpu.',
+        type=int,
+        default=1)
+
+    parser.add_argument(
+        '--device',
+        choices=['cpu', 'gpu'],
+        default="gpu",
+        help="Select which device to inference, defaults to gpu.")
+
+    # NOTE(review): type=eval passes the raw command-line text to Python's
+    # eval() before `choices` is checked, so any expression given here is
+    # evaluated. Consider an explicit string-to-bool converter instead.
+    parser.add_argument(
+        '--use_trt',
+        default=False,
+        type=eval,
+        choices=[True, False],
+        help='Whether to use Nvidia TensorRT to accelerate prediction.')
+    parser.add_argument(
+        "--precision",
+        default="fp32",
+        type=str,
+        choices=["fp32", "fp16", "int8"],
+        help='The tensorrt precision.')
+
+    parser.add_argument(
+        '--cpu_threads',
+        default=10,
+        type=int,
+        help='Number of threads to predict when using cpu.')
+    # NOTE(review): same eval() concern as --use_trt above.
+    parser.add_argument(
+        '--enable_mkldnn',
+        default=False,
+        type=eval,
+        choices=[True, False],
+        help='Enable to use mkldnn to speed up when using cpu.')
+
+    # The two flags below are plain switches: absent -> False, present -> True.
+    parser.add_argument(
+        '--with_argmax',
+        dest='with_argmax',
+        help='Perform argmax operation on the predict result.',
+        action='store_true')
+
+    parser.add_argument(
+        '--print_detail',
+        dest='print_detail',
+        help='Print GLOG information of Paddle Inference.',
+        action='store_true')
+
+    return parser.parse_args()
+
+
+class DatasetPredictor(Predictor):
+    """
+    Predictor that runs the inference model over a whole dataset and logs
+    segmentation metrics (mIoU, accuracy, kappa) plus the average run time.
+
+    The methods use ``self.args``, ``self.cfg``, ``self.predictor`` and
+    ``self.postprocess``, none of which are defined in this class --
+    presumably they are provided by ``Predictor`` from ``infer``; verify
+    against that class.
+    """
+    def __init__(self, args):
+        # No extra state is added; construction is delegated to Predictor.
+        super().__init__(args)
+
+    def test_dataset(self):
+        """
+        Read the data from dataset and calculate the accuracy of the inference model.
+
+        The dataset class is looked up by ``self.args.dataset_type`` in
+        ``manager.DATASETS`` and every ``(img, label)`` pair it yields is run
+        through the predictor one image at a time. Results are only logged;
+        nothing is returned.
+
+        Raises:
+            RuntimeError: If ``self.args.dataset_type`` is not a key of
+                ``manager.DATASETS.components_dict``.
+        """
+        comp = manager.DATASETS
+        if self.args.dataset_type not in comp.components_dict:
+            raise RuntimeError("The dataset is not supported.")
+        # Keyword arguments forwarded to the dataset constructor.
+        kwargs = {
+            'transforms': self.cfg.transforms.transforms,
+            'dataset_root': self.args.dataset_path,
+            'mode': self.args.dataset_mode
+        }
+        dataset = comp[self.args.dataset_type](**kwargs)
+
+        # Only the first input and the first output of the predictor are used.
+        input_names = self.predictor.get_input_names()
+        input_handle = self.predictor.get_input_handle(input_names[0])
+        output_names = self.predictor.get_output_names()
+        output_handle = self.predictor.get_output_handle(output_names[0])
+
+        # Running totals, accumulated with `+` across all images.
+        intersect_area_all = 0
+        pred_area_all = 0
+        label_area_all = 0
+        total_time = 0
+        progbar_val = progbar.Progbar(target=len(dataset), verbose=1)
+
+        for idx, (img, label) in enumerate(dataset):
+            # Wrap the single image in a leading axis of length 1.
+            data = np.array([img])
+            input_handle.reshape(data.shape)
+            input_handle.copy_from_cpu(data)
+
+            # Only predictor.run() is timed; the input copy, output copy and
+            # post-processing are excluded from total_time.
+            start_time = time.time()
+            self.predictor.run()
+            end_time = time.time()
+            total_time += (end_time - start_time)
+
+            pred = output_handle.copy_to_cpu()
+            pred = self.postprocess(paddle.to_tensor(pred))
+            label = paddle.to_tensor(label, dtype="int32")
+
+            intersect_area, pred_area, label_area = metrics.calculate_area(
+                pred,
+                label,
+                dataset.num_classes,
+                ignore_index=dataset.ignore_index)
+
+            intersect_area_all = intersect_area_all + intersect_area
+            pred_area_all = pred_area_all + pred_area
+            label_area_all = label_area_all + label_area
+
+            progbar_val.update(idx + 1)
+
+        # Metrics are computed once from the totals, not averaged per image.
+        class_iou, miou = metrics.mean_iou(intersect_area_all, pred_area_all,
+                                           label_area_all)
+        class_acc, acc = metrics.accuracy(intersect_area_all, pred_area_all)
+        kappa = metrics.kappa(intersect_area_all, pred_area_all, label_area_all)
+
+        logger.info(
+            "[EVAL] #Images: {} mIoU: {:.4f} Acc: {:.4f} Kappa: {:.4f} ".format(
+                len(dataset), miou, acc, kappa))
+        logger.info("[EVAL] Class IoU: \n" + str(np.round(class_iou, 4)))
+        logger.info("[EVAL] Class Acc: \n" + str(np.round(class_acc, 4)))
+        # NOTE(review): an empty dataset is not handled; if this line is
+        # reached with len(dataset) == 0 the division raises ZeroDivisionError.
+        logger.info("[EVAL] Average time: %.3f second/img" %
+                    (total_time / len(dataset)))
+
+
+def main(args):
+    """
+    Create a ``DatasetPredictor`` from ``args`` and evaluate it on the dataset.
+
+    Args:
+        args: Parsed options; ``dataset_type`` and ``dataset_path`` are
+            checked here, the rest is consumed by ``DatasetPredictor``.
+
+    Raises:
+        RuntimeError: If ``args.dataset_type`` or ``args.dataset_path`` is
+            falsy (for example an empty string).
+    """
+    # The predictor is constructed before the arguments are validated.
+    predictor = DatasetPredictor(args)
+    if args.dataset_type and args.dataset_path:
+        predictor.test_dataset()
+    else:
+        raise RuntimeError("Please set dataset_type and dataset_path.")
+
+
+if __name__ == '__main__':
+    """
+    Based on the infer config and dataset, this program reads the test and
+    label images, applies the transforms, runs the predictor, and outputs the accuracy.
+
+    For example:
+    python deploy/python/infer_benchmark.py \
+        --config path/to/bisenetv2/deploy.yaml \
+        --dataset_type Cityscapes \
+        --dataset_path path/to/cityscapes
+    """
+    args = parse_args()
+    main(args)
@@ -12,20 +12,18 @@ PaddleSeg基于PaddleSlim，集成了量化训练（QAT）方法，特点如下
 
 ## 1 环境准备
 
-首先，请确保准备好PaddleSeg的基础环境。大家可以在PaddleSeg根目录执行如下命令，如果在`PaddleSeg/output`文件夹中出现预测结果，则证明安装成功。
+请参考[安装文档](../../install.md)准备好PaddleSeg的基础环境，测试是否安装成功。
 
-```
-python predict.py \
-       --config configs/quick_start/bisenet_optic_disc_512x512_1k.yml \
-       --model_path https://bj.bcebos.com/paddleseg/dygraph/optic_disc/bisenet_optic_disc_512x512_1k/model.pdparams\
-       --image_path docs/images/optic_test_image.jpg \
-       --save_dir output/result
-```
-
-然后，大家需要再安装最新版本的PaddleSlim。
+安装PaddleSlim。
 
 ```shell
-pip install paddleslim -i https://pypi.tuna.tsinghua.edu.cn/simple
+git clone https://github.com/PaddlePaddle/PaddleSlim.git
+cd PaddleSlim
+# 切换到特定commit id
+git reset --hard 15ef0c7dcee5a622787b7445f21ad9d1dea0a933
+
+# 安装
+python setup.py install
 ```
 
 ## 2 产出量化模型
@@ -40,7 +38,7 @@ pip install paddleslim -i https://pypi.tuna.tsinghua.edu.cn/simple
 
 ```shell
 # 设置1张可用的GPU卡
-export CUDA_VISIBLE_DEVICES=0 
+export CUDA_VISIBLE_DEVICES=0
 # windows下请执行以下命令
 # set CUDA_VISIBLE_DEVICES=0
 
 
@@ -360,6 +360,9 @@ def __init__(self,
                 reduction_ratio=16,
                 name=name + '_fc')
 
+        self.add = layers.add()
+        self.relu = layers.Activation("relu")
+
     def forward(self, x):
         residual = x
         conv1 = self.conv1(x)
@@ -372,8 +375,8 @@ def forward(self, x):
         if self.has_se:
             conv3 = self.se(conv3)
 
-        y = conv3 + residual
-        y = F.relu(y)
+        y = self.add(conv3, residual)
+        y = self.relu(y)
         return y
 
 
@@ -419,6 +422,9 @@ def __init__(self,
                 reduction_ratio=16,
                 name=name + '_fc')
 
+        self.add = layers.add()
+        self.relu = layers.Activation("relu")
+
     def forward(self, x):
         residual = x
         conv1 = self.conv1(x)
@@ -430,8 +436,8 @@ def forward(self, x):
         if self.has_se:
             conv2 = self.se(conv2)
 
-        y = conv2 + residual
-        y = F.relu(y)
+        y = self.add(conv2, residual)
+        y = self.relu(y)
         return y