3 jaren geleden · b781b3c619
--- a/PaddleDetection
+++ b/PaddleDetection
@@ -1 +1 @@
 
															-Subproject commit d41b085d66946219351d8d99c2b3d95756489624
														
 
															+Subproject commit 692d732994660ceba82c75034c802eb1138239cf
														
--- a/README.md
+++ b/README.md
@@ -5,7 +5,7 @@
 
															 <p align="left">
														
 
															     <a href="./LICENSE"><img src="https://img.shields.io/badge/license-Apache%202-red.svg"></a>
														
 
															-    <a href="https://github.com/PaddlePaddle/PaddleOCR/releases"><img src="https://img.shields.io/github/release/PaddlePaddle/PaddleX.svg"></a>
														
 
															+    <a href="https://github.com/PaddlePaddle/PaddleX/releases"><img src="https://img.shields.io/github/release/PaddlePaddle/PaddleX.svg"></a>
														
 
															     <a href=""><img src="https://img.shields.io/badge/python-3.6+-orange.svg"></a>
														
 
															     <a href=""><img src="https://img.shields.io/badge/os-linux%2C%20win%2C%20mac-yellow.svg"></a>
														
 
															     <a href=""><img src="https://img.shields.io/badge/QQ_Group-957286141-52B6EF?style=social&logo=tencent-qq&logoColor=000&logoWidth=20"></a>
														
@@ -27,6 +27,14 @@
 
															 ## 近期动态
														
 
															+
														
 
															+2021.12.10 PaddleX发布2.1.0版本
														
 
															+* 新增超轻量分类模型PPLCNet，在Intel CPU上，单张图像预测速度约5ms，ImageNet-1K数据集上Top1识别准确率达到80.82%，超越ResNet152的模型效果 [欢迎体验](./tutorials/train/image_classification/pplcnet.py)
														
 
															+* 新增轻量级检测特色模型PP-PicoDet，第一个在1M参数量之内mAP(0.5:0.95)超越30+(输入416像素时)，网络预测在ARM CPU下可达150FPS [欢迎体验](./tutorials/train/object_detection/picodet.py)
														
 
															+* 升级PaddleX Restful API，支持飞桨动态图开发模式 [欢迎体验](docs/Resful_API/docs/readme.md)
														
 
															+* 新增检测模型负样本训练策略 [欢迎体验](docs/data/format/detection.md#3)
														
 
															+* 新增python轻量级服务化部署 [欢迎体验](./docs/hub_serving_deploy.md)
														
 
															+
														
 
															 2021.09.10 PaddleX发布2.0.0正式版本。
														
 
															 - 全新发布Manufacture SDK，支持多模型串联部署。[欢迎体验](./deploy/cpp/docs/manufacture_sdk)
														
 
															 - PaddleX部署全面升级，支持飞桨视觉套件PaddleDetection、PaddleClas、PaddleSeg、PaddleX的端到端统一部署能力。[欢迎体验](./deploy/cpp/docs/deployment.md)
														
--- a/deploy/cpp/docs/compile/paddle/linux.md
+++ b/deploy/cpp/docs/compile/paddle/linux.md
@@ -39,7 +39,10 @@ PaddlePaddle C++ 预测库针对是否使用GPU、是否支持TensorRT、以及
 
															 ```
														
 
															 ### Step 3. 修改编译参数
														
 
															-根据自己的系统环境，修改`PaddleX/deploy/cpp/script/build.sh`脚本中的参数，主要修改的参数为以下几个
														
 
															+根据自己的系统环境，修改`PaddleX/deploy/cpp/scripts/build.sh`脚本中的参数，主要修改的参数为以下几个
														
 
															 | 参数          | 说明                                                                                 |
														
 
															 | :------------ | :----------------------------------------------------------------------------------- |
														
 
															 | WITH_GPU      | ON或OFF，表示是否使用GPU，当下载的为CPU预测库时，设为OFF                             |
														
@@ -54,7 +57,7 @@ PaddlePaddle C++ 预测库针对是否使用GPU、是否支持TensorRT、以及
 
															 ### Step 4. 编译
														
 
															 修改完build.sh后执行编译:  
														
 
															 ```commandline
														
 
															-sh script/build.sh
														
 
															+sh scripts/build.sh
														
 
															 ```
														
 
															 **[注意]**:
														
@@ -63,7 +66,7 @@ sh script/build.sh
 
															 #### 编译环境无法联网导致编译失败？
														
 
															-> 编译过程，会调用script/bootstrap.sh联网下载opencv、openssl，以及yaml依赖包，如无法联网，用户按照下操作手动下载
														
 
															+> 编译过程，会调用scripts/bootstrap.sh联网下载opencv、openssl，以及yaml依赖包，如无法联网，用户可按照以下操作手动下载
														
 
															 >
														
 
															 > 1. 根据系统版本，点击右侧链接下载不同版本的opencv依赖 [Ubuntu 16.04](https://bj.bcebos.com/paddleseg/deploy/opencv3.4.6gcc4.8ffmpeg.tar.gz2)/[Ubuntu 18.04](https://bj.bcebos.com/paddlex/deploy/opencv3.4.6gcc4.8ffmpeg_ubuntu_18.04.tar.gz2)
														
 
															 > 2. 解压下载的opencv依赖（解压后目录名为opencv3.4.6gcc4.8ffmpeg)，创建目录`PaddleX/deploy/cpp/deps`，将解压后的目录拷贝至该创建的目录下
														
--- a/deploy/cpp/docs/csharp_deploy/model_infer.cpp
+++ b/deploy/cpp/docs/csharp_deploy/model_infer.cpp
@@ -24,7 +24,7 @@ PaddleDeploy::Model* model;
 
															 * paddlex_model_type: When model_type is paddlex, the actual PaddleX model type returned - det, seg, clas
														
 
															 *
														
 
															 */
														
 
															-extern "C" void InitModel(const char* model_type, const char* model_filename, const char* params_filename, const char* cfg_file, bool use_gpu, int gpu_id, char* paddlex_model_type)
														
 
															+extern "C" __declspec(dllexport) void InitModel(const char* model_type, const char* model_filename, const char* params_filename, const char* cfg_file, bool use_gpu, int gpu_id, char* paddlex_model_type)
														
 
															 {
														
 
															 	// create model
														
 
															 	model = PaddleDeploy::CreateModel(model_type);  //FLAGS_model_type
														
@@ -83,7 +83,7 @@ extern "C" void InitModel(const char* model_type, const char* model_filename, co
 
															 *
														
 
															 * extern "C"
														
 
															 */
														
 
															-extern "C" void Det_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* output, int* nBoxesNum, char* LabelList)
														
 
															+extern "C" __declspec(dllexport) void Det_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* output, int* nBoxesNum, char* LabelList)
														
 
															 {
														
 
															 	// prepare data
														
 
															 	std::vector<cv::Mat> imgs;
														
@@ -143,7 +143,7 @@ extern "C" void Det_ModelPredict(const unsigned char* img, int nWidth, int nHeig
 
															 *
														
 
															 * extern "C"
														
 
															 */
														
 
															-extern "C" void Seg_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, unsigned char* output)
														
 
															+extern "C" __declspec(dllexport) void Seg_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, unsigned char* output)
														
 
															 {
														
 
															 	// prepare data
														
 
															 	std::vector<cv::Mat> imgs;
														
@@ -192,7 +192,7 @@ extern "C" void Seg_ModelPredict(const unsigned char* img, int nWidth, int nHeig
 
															 *
														
 
															 * extern "C"
														
 
															 */
														
 
															-extern "C" void Cls_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* score, char* category, int* category_id)
														
 
															+extern "C" __declspec(dllexport) void Cls_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* score, char* category, int* category_id)
														
 
															 {
														
 
															 	// prepare data
														
 
															 	std::vector<cv::Mat> imgs;
														
@@ -245,7 +245,7 @@ extern "C" void Cls_ModelPredict(const unsigned char* img, int nWidth, int nHeig
 
															 *
														
 
															 * extern "C"
														
 
															 */
														
 
															-extern "C" void Mask_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* box_output, unsigned char* mask_output, int* nBoxesNum, char* LabelList)
														
 
															+extern "C" __declspec(dllexport) void Mask_ModelPredict(const unsigned char* img, int nWidth, int nHeight, int nChannel, float* box_output, unsigned char* mask_output, int* nBoxesNum, char* LabelList)
														
 
															 {
														
 
															 	// prepare data
														
 
															 	std::vector<cv::Mat> imgs;
														
@@ -305,7 +305,7 @@ extern "C" void Mask_ModelPredict(const unsigned char* img, int nWidth, int nHei
 
															 *
														
 
															 * extern "C"
														
 
															 */
														
 
															-extern "C" void DestructModel()
														
 
															+extern "C" __declspec(dllexport) void DestructModel()
														
 
															 {
														
 
															 	delete model;
														
 
															 	std::cout << "destruct model success" << std::endl;
														
--- a/docs/CHANGELOG.md
+++ b/docs/CHANGELOG.md
@@ -2,6 +2,24 @@
 
															 ## 最新版本信息
														
 
															+- **2021.12.10 v2.1.0**
														
 
															+
														
 
															+  * PaddleX API
														
 
															+    - 新增超轻量分类模型PPLCNet，在Intel CPU上，单张图像预测速度约5ms，ImageNet-1K数据集上Top1识别准确率达到80.82%，超越ResNet152的模型效果
														
 
															+    - 新增轻量级检测特色模型PP-PicoDet，第一个在1M参数量之内mAP(0.5:0.95)超越30+(输入416像素时)，网络预测在ARM CPU下可达150FPS
														
 
															+    - 新增检测模型负样本训练策略
														
 
															+
														
 
															+  * 预测部署
														
 
															+    - 新增python轻量级服务化部署
														
 
															+
														
 
															+  * PaddleX GUI
														
 
															+    - 新增超轻量分类模型PPLCNet、轻量级检测特色模型PP-PicoDet
														
 
															+
														
 
															+  * PaddleX Restful API
														
 
															+    - 全面升级，支持飞桨动态图开发模式
														
 
															+    - 提供Html Demo两种前端调用方式
														
 
															+
														
 
															+
														
 
															 - **2021.09.10 v2.0.0**
														
 
															   * PaddleX API
														
--- a/docs/Resful_API/docs/readme.md
+++ b/docs/Resful_API/docs/readme.md
@@ -31,19 +31,16 @@ PaddleX RESTful是基于PaddleX开发的RESTful API。对于开发者来说只
 
															 在该示例中PaddleX_Restful运行在一台带GPU的linux服务器下，用户通过其他电脑连接该服务器进行远程的操作。
														
 
															 ### 1  环境准备
														
 
															-在服务器下载PaddlePaddle和PaddleX及其他依赖
														
 
															-
														
 
															-* 下载PaddlePaddle
														
 
															-`pip install paddlepaddle-gpu -i `
														
 
															+在服务器下载PaddlePaddle和PaddleX及其他依赖
														
 
															-* 下载PaddleX
														
 
															+* 下载安装PaddleX>=2.1.0和PaddlePaddle>= 2.2.0
														
 
															-pip install paddlex==1.3.11 -i
														
 
															+详见[PaddleX API快速安装](../../../docs/quick_start_API.md#PaddleX-200安装)
														
 
															 * 下载pycuda（如果不使用GPU，该项可不进行下载）
														
 
															-pip install pycuda -i
														
 
															+pip install pycuda
														
 
															 ### 2  启动Restful服务
														
@@ -127,10 +124,10 @@ pip install pycuda -i
 
															 * ## 客户端图形化界面
														
 
															-客户端操作流程和Web界面基本一致，提供了MAC和Windows版本两种，用户可自行下载并操作
														
 
															-- [MAC](https://bj.bcebos.com/paddlex/PaddleX_Remote_GUI/mac/PaddleX_Remote_GUI.zip)
														
 
															-- [Windows](https://bj.bcebos.com/paddlex/PaddleX_Remote_GUI/windows/PaddleX_Remote_GUI.zip)
														
 
															+客户端操作流程和Web界面基本一致，后续将提供Windows版本，供用户自行下载并操作
														
 
															+
														
 
															+Windows客户端即将到来！
														
 
															 ### 4  Restful 二次开发说明
														
--- a/docs/apis/datasets.md
+++ b/docs/apis/datasets.md
@@ -30,7 +30,7 @@ paddlex.datasets.ImageNet(data_dir, file_list, label_list, transforms=None, num_
 
															 ## <h2 id="2">paddlex.datasets.VOCDetection</h2>
														
 
															 > **用于目标检测模型**  
														
 
															 ```python
														
 
															-paddlex.datasets.VOCDetection(data_dir, file_list, label_list, transforms=None, num_workers='auto', shuffle=False)
														
 
															+paddlex.datasets.VOCDetection(data_dir, file_list, label_list, transforms=None, num_workers='auto', shuffle=False, allow_empty=False, empty_ratio=1.)
														
 
															 ```
														
 
															 > 读取PascalVOC格式的检测数据集，并对样本进行相应的处理。PascalVOC数据集格式的介绍可查看文档:[数据集格式说明](../data/format/detection.md)  
														
@@ -46,6 +46,7 @@ paddlex.datasets.VOCDetection(data_dir, file_list, label_list, transforms=None,
 
															 > > * **num_workers** (int|str)：数据集中样本在预处理过程中的进程数。默认为'auto'。当设为'auto'时，根据系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8，则`num_workers`为8，否则为CPU核数的一半。
														
 
															 > > * **shuffle** (bool): 是否需要对数据集中样本打乱顺序。默认为False。
														
 
															 > > * **allow_empty** (bool): 是否加载负样本。默认为False。
														
 
															+> > * **empty_ratio** (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															 ### <h3 id="21">cluster_yolo_anchor</h3>
														
@@ -144,7 +145,7 @@ model.train(
 
															 ## <h2 id="3">paddlex.datasets.CocoDetection</h2>
														
 
															 > **用于实例分割/目标检测模型**  
														
 
															 ```python
														
 
															-paddlex.datasets.CocoDetection(data_dir, ann_file, transforms=None, num_workers='auto', shuffle=False)
														
 
															+paddlex.datasets.CocoDetection(data_dir, ann_file, transforms=None, num_workers='auto', shuffle=False, allow_empty=False, empty_ratio=1.)
														
 
															 ```
														
 
															 > 读取MSCOCO格式的检测数据集，并对样本进行相应的处理，该格式的数据集同样可以应用到实例分割模型的训练中。MSCOCO数据集格式的介绍可查看文档:[数据集格式说明](../data/format/instance_segmentation.md)  
														
@@ -159,6 +160,7 @@ paddlex.datasets.CocoDetection(data_dir, ann_file, transforms=None, num_workers=
 
															 > > * **num_workers** (int|str)：数据集中样本在预处理过程中的线程或进程数。默认为'auto'。当设为'auto'时，根据系统的实际CPU核数设置`num_workers`: 如果CPU核数的一半大于8，则`num_workers`为8，否则为CPU核数的一半。  
														
 
															 > > * **shuffle** (bool): 是否需要对数据集中样本打乱顺序。默认为False。
														
 
															 > > * **allow_empty** (bool): 是否加载负样本。默认为False。
														
 
															+> > * **empty_ratio** (float): 用于指定负样本占总样本数的比例。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															 ### <h3 id="31">cluster_yolo_anchor</h3>
														
--- a/docs/apis/models/classification.md
+++ b/docs/apis/models/classification.md
@@ -25,7 +25,7 @@ paddlex.cls.ResNet50(num_classes=1000)
 
															 ### <h3 id="11">train</h3>
														
 
															 ```python
														
 
															-train(self, num_epochs, train_dataset, train_batch_size=64, eval_dataset=None, optimizer=None, save_interval_epochs=1, log_interval_steps=10, save_dir='output', pretrain_weights='IMAGENET', learning_rate=.025, warmup_steps=0, warmup_start_lr=0.0, lr_decay_epochs=(30, 60, 90), lr_decay_gamma=0.1, early_stop=False, early_stop_patience=5, use_vdl=True)
														
 
															+train(self, num_epochs, train_dataset, train_batch_size=64, eval_dataset=None, optimizer=None, save_interval_epochs=1, log_interval_steps=10, save_dir='output', pretrain_weights='IMAGENET', learning_rate=.025, warmup_steps=0, warmup_start_lr=0.0, lr_decay_epochs=(30, 60, 90), lr_decay_gamma=0.1, label_smoothing=None, early_stop=False, early_stop_patience=5, use_vdl=True)
														
 
															 ```
														
 
															 >
														
 
															 > **参数**
														
@@ -44,6 +44,7 @@ train(self, num_epochs, train_dataset, train_batch_size=64, eval_dataset=None, o
 
															 - **warmup_start_lr**(float): 默认优化器的warmup起始学习率，默认为0.0。
														
 
															 - **lr_decay_epochs** (list): 默认优化器的学习率衰减轮数。默认为[30, 60, 90]。
														
 
															 - **lr_decay_gamma** (float): 默认优化器的学习率衰减率。默认为0.1。
														
 
															+- **label_smoothing** (float, bool or None): 是否使用标签平滑。若为float，表示标签平滑系数。若为True，使用系数为0.1的标签平滑。若为None或False，则不采用标签平滑。默认为None。
														
 
															 - **early_stop** (bool): 是否使用提前终止训练策略。默认为False。
														
 
															 - **early_stop_patience** (int): 当使用提前终止训练策略时，如果验证集精度在`early_stop_patience`个epoch内连续下降或持平，则终止训练。默认为5。
														
 
															 - **use_vdl** (bool): 是否使用VisualDL进行可视化。默认为True。
														
@@ -171,43 +172,45 @@ quant_aware_train(self, num_epochs, train_dataset, train_batch_size=64, eval_dat
 
															 PaddleX提供了共计40种分类模型，所有分类模型均提供同`ResNet50`相同的训练`train`，评估`evaluate`，预测`predict`，敏感度分析`analyze_sensitivity`，剪裁`prune`和在线量化`quant_aware_train`接口，各模型效果可参考[模型库](../../appendix/model_zoo.md)。
														
 
															-| 模型              | 接口                    |
														
 
															-| :---------------- | :---------------------- |
														
 
															-| ResNet18          | paddlex.cls.ResNet18(num_classes=1000) |
														
 
															-| ResNet18_vd       | paddlex.cls.ResNet18_vd(num_classes=1000) |
														
 
															-| ResNet34          | paddlex.cls.ResNet34(num_classes=1000) |
														
 
															-| ResNet34_vd          | paddlex.cls.ResNet34_vd(num_classes=1000) |
														
 
															-| ResNet50          | paddlex.cls.ResNet50(num_classes=1000) |
														
 
															-| ResNet50_vd       | paddlex.cls.ResNet50_vd(num_classes=1000) |
														
 
															-| ResNet50_vd_ssld    | paddlex.cls.ResNet50_vd_ssld(num_classes=1000) |
														
 
															-| ResNet101          | paddlex.cls.ResNet101(num_classes=1000) |
														
 
															-| ResNet101_vd        | paddlex.cls.ResNet101_vd(num_classes=1000) |
														
 
															-| ResNet101_vd_ssld   | paddlex.cls.ResNet101_vd_ssld(num_classes=1000) |
														
 
															-| ResNet152 | paddlex.cls.ResNet152(num_classes=1000) |
														
 
															-| ResNet152_vd | paddlex.cls.ResNet152_vd(num_classes=1000) |
														
 
															-| ResNet200_vd | paddlex.cls.ResNet200_vd(num_classes=1000) |
														
 
															-| DarkNet53      | paddlex.cls.DarkNet53(num_classes=1000) |
														
 
															-| MobileNetV1         | paddlex.cls.MobileNetV1(num_classes=1000, scale=1.0) |
														
 
															-| MobileNetV2       | paddlex.cls.MobileNetV2(num_classes=1000, scale=1.0) |
														
 
															-| MobileNetV3_small       | paddlex.cls.MobileNetV3_small(num_classes=1000, scale=1.0) |
														
 
															-| MobileNetV3_small_ssld  | paddlex.cls.MobileNetV3_small_ssld(num_classes=1000, scale=1.0) |
														
 
															-| MobileNetV3_large   | paddlex.cls.MobileNetV3_large(num_classes=1000, scale=1.0) |
														
 
															-| MobileNetV3_large_ssld | paddlex.cls.MobileNetV3_large_ssld(num_classes=1000) |
														
 
															-| Xception41     | paddlex.cls.Xception41(num_classes=1000) |
														
 
															-| Xception65     | paddlex.cls.Xception65(num_classes=1000) |
														
 
															-| Xception71     | paddlex.cls.Xception71(num_classes=1000) |
														
 
															-| ShuffleNetV2     | paddlex.cls.ShuffleNetV2(num_classes=1000, scale=1.0) |
														
 
															-| ShuffleNetV2_swish     | paddlex.cls.ShuffleNetV2_swish(num_classes=1000) |
														
 
															-| DenseNet121      | paddlex.cls.DenseNet121(num_classes=1000) |
														
 
															-| DenseNet161       | paddlex.cls.DenseNet161(num_classes=1000) |
														
 
															-| DenseNet169       | paddlex.cls.DenseNet169(num_classes=1000) |
														
 
															-| DenseNet201       | paddlex.cls.DenseNet201(num_classes=1000) |
														
 
															-| DenseNet264       | paddlex.cls.DenseNet264(num_classes=1000) |
														
 
															-| HRNet_W18_C       | paddlex.cls.HRNet_W18_C(num_classes=1000) |
														
 
															-| HRNet_W30_C       | paddlex.cls.HRNet_W30_C(num_classes=1000) |
														
 
															-| HRNet_W32_C       | paddlex.cls.HRNet_W32_C(num_classes=1000) |
														
 
															-| HRNet_W40_C       | paddlex.cls.HRNet_W40_C(num_classes=1000) |
														
 
															-| HRNet_W44_C       | paddlex.cls.HRNet_W44_C(num_classes=1000) |
														
 
															-| HRNet_W48_C       | paddlex.cls.HRNet_W48_C(num_classes=1000) |
														
 
															-| HRNet_W64_C       | paddlex.cls.HRNet_W64_C(num_classes=1000) |
														
 
															-| AlexNet         | paddlex.cls.AlexNet(num_classes=1000) |
														
 
															+| 模型                     | 接口                                                              |
														
 
															+|:-----------------------|:----------------------------------------------------------------|
														
 
															+| PPLCNet                | paddlex.cls.PPLCNet(num_classes=1000)                           |
														
 
															+| PPLCNet_ssld                | paddlex.cls.PPLCNet_ssld(num_classes=1000)                      |
														
 
															+| ResNet18               | paddlex.cls.ResNet18(num_classes=1000)                          |
														
 
															+| ResNet18_vd            | paddlex.cls.ResNet18_vd(num_classes=1000)                       |
														
 
															+| ResNet34               | paddlex.cls.ResNet34(num_classes=1000)                          |
														
 
															+| ResNet34_vd            | paddlex.cls.ResNet34_vd(num_classes=1000)                       |
														
 
															+| ResNet50               | paddlex.cls.ResNet50(num_classes=1000)                          |
														
 
															+| ResNet50_vd            | paddlex.cls.ResNet50_vd(num_classes=1000)                       |
														
 
															+| ResNet50_vd_ssld       | paddlex.cls.ResNet50_vd_ssld(num_classes=1000)                  |
														
 
															+| ResNet101              | paddlex.cls.ResNet101(num_classes=1000)                         |
														
 
															+| ResNet101_vd           | paddlex.cls.ResNet101_vd(num_classes=1000)                      |
														
 
															+| ResNet101_vd_ssld      | paddlex.cls.ResNet101_vd_ssld(num_classes=1000)                 |
														
 
															+| ResNet152              | paddlex.cls.ResNet152(num_classes=1000)                         |
														
 
															+| ResNet152_vd           | paddlex.cls.ResNet152_vd(num_classes=1000)                      |
														
 
															+| ResNet200_vd           | paddlex.cls.ResNet200_vd(num_classes=1000)                      |
														
 
															+| DarkNet53              | paddlex.cls.DarkNet53(num_classes=1000)                         |
														
 
															+| MobileNetV1            | paddlex.cls.MobileNetV1(num_classes=1000, scale=1.0)            |
														
 
															+| MobileNetV2            | paddlex.cls.MobileNetV2(num_classes=1000, scale=1.0)            |
														
 
															+| MobileNetV3_small      | paddlex.cls.MobileNetV3_small(num_classes=1000, scale=1.0)      |
														
 
															+| MobileNetV3_small_ssld | paddlex.cls.MobileNetV3_small_ssld(num_classes=1000, scale=1.0) |
														
 
															+| MobileNetV3_large      | paddlex.cls.MobileNetV3_large(num_classes=1000, scale=1.0)      |
														
 
															+| MobileNetV3_large_ssld | paddlex.cls.MobileNetV3_large_ssld(num_classes=1000)            |
														
 
															+| Xception41             | paddlex.cls.Xception41(num_classes=1000)                        |
														
 
															+| Xception65             | paddlex.cls.Xception65(num_classes=1000)                        |
														
 
															+| Xception71             | paddlex.cls.Xception71(num_classes=1000)                        |
														
 
															+| ShuffleNetV2           | paddlex.cls.ShuffleNetV2(num_classes=1000, scale=1.0)           |
														
 
															+| ShuffleNetV2_swish     | paddlex.cls.ShuffleNetV2_swish(num_classes=1000)                |
														
 
															+| DenseNet121            | paddlex.cls.DenseNet121(num_classes=1000)                       |
														
 
															+| DenseNet161            | paddlex.cls.DenseNet161(num_classes=1000)                       |
														
 
															+| DenseNet169            | paddlex.cls.DenseNet169(num_classes=1000)                       |
														
 
															+| DenseNet201            | paddlex.cls.DenseNet201(num_classes=1000)                       |
														
 
															+| DenseNet264            | paddlex.cls.DenseNet264(num_classes=1000)                       |
														
 
															+| HRNet_W18_C            | paddlex.cls.HRNet_W18_C(num_classes=1000)                       |
														
 
															+| HRNet_W30_C            | paddlex.cls.HRNet_W30_C(num_classes=1000)                       |
														
 
															+| HRNet_W32_C            | paddlex.cls.HRNet_W32_C(num_classes=1000)                       |
														
 
															+| HRNet_W40_C            | paddlex.cls.HRNet_W40_C(num_classes=1000)                       |
														
 
															+| HRNet_W44_C            | paddlex.cls.HRNet_W44_C(num_classes=1000)                       |
														
 
															+| HRNet_W48_C            | paddlex.cls.HRNet_W48_C(num_classes=1000)                       |
														
 
															+| HRNet_W64_C            | paddlex.cls.HRNet_W64_C(num_classes=1000)                       |
														
 
															+| AlexNet                | paddlex.cls.AlexNet(num_classes=1000)                           |
														
--- a/docs/apis/models/detection.md
+++ b/docs/apis/models/detection.md
@@ -11,8 +11,9 @@
 
															   * [quant_aware_train](#16)
														
 
															 * [paddlex.det.PPYOLO](#2)
														
 
															 * [paddlex.det.PPYOLOTiny](#3)
														
 
															-* [paddlex.det.YOLOv3](#4)
														
 
															-* [paddlex.det.FasterRCNN](#5)
														
 
															+* [paddlex.det.PicoDet](#4)
														
 
															+* [paddlex.det.YOLOv3](#5)
														
 
															+* [paddlex.det.FasterRCNN](#6)
														
 
															 ## <h2 id="1">paddlex.det.PPYOLOv2</h2>
														
@@ -262,7 +263,33 @@ paddlex.det.PPYOLOTiny(num_classes=80, backbone='MobileNetV3', anchors=[[10, 15]
 
															 > - prune 剪裁接口说明同 [PPYOLOv2模型prune接口](#prune)
														
 
															 > - quant_aware_train 在线量化接口说明同 [PPYOLOv2模型quant_aware_train接口](#quant_aware_train)
														
 
															-## <h2 id="4">paddlex.det.YOLOv3</h2>
														
 
															+
														
 
															+## <h2 id="4">paddlex.det.PicoDet</h2>
														
 
															+
														
 
															+```python
														
 
															+paddlex.det.PicoDet(num_classes=80, backbone='ESNet_m', nms_score_threshold=.025, nms_topk=1000, nms_keep_topk=100, nms_iou_threshold=.6)
														
 
															+```
														
 
															+
														
 
															+> 构建PicoDet检测器。
														
 
															+
														
 
															+> **参数**
														
 
															+>
														
 
															+> > - **num_classes** (int): 类别数。默认为80。
														
 
															+> > - **backbone** (str): PicoDet的backbone网络，取值范围为['ESNet_s', 'ESNet_m', 'ESNet_l', 'LCNet', 'MobileNetV3', 'ResNet18_vd']。默认为'ESNet_m'。
														
 
															+> > - **nms_score_threshold** (float): 检测框的置信度得分阈值，置信度得分低于阈值的框应该被忽略。默认为0.025。
														
 
															+> > - **nms_topk** (int): 进行NMS时，根据置信度保留的最大检测框数。默认为1000。
														
 
															+> > - **nms_keep_topk** (int): 进行NMS后，每个图像要保留的总检测框数。默认为100。
														
 
															+> > - **nms_iou_threshold** (float): 进行NMS时，用于剔除检测框IoU的阈值。默认为0.6。
														
 
															+
														
 
															+> - train 训练接口说明同 [PPYOLOv2模型train接口](#train)
														
 
															+> - evaluate 评估接口说明同 [PPYOLOv2模型evaluate接口](#evaluate)
														
 
															+> - predict 预测接口说明同 [PPYOLOv2模型predict接口](#predict)
														
 
															+> - analyze_sensitivity 敏感度分析接口说明同 [PPYOLOv2模型analyze_sensitivity接口](#analyze_sensitivity)
														
 
															+> - prune 剪裁接口说明同 [PPYOLOv2模型prune接口](#prune)
														
 
															+> - quant_aware_train 在线量化接口说明同 [PPYOLOv2模型quant_aware_train接口](#quant_aware_train)
														
 
															+
														
 
															+
														
 
															+## <h2 id="5">paddlex.det.YOLOv3</h2>
														
 
															 ```python
														
 
															 paddlex.det.YOLOv3(num_classes=80, backbone='MobileNetV1', anchors=[[10, 13], [16, 30], [33, 23], [30, 61], [62, 45], [59, 119], [116, 90], [156, 198], [373, 326]], anchor_masks=[[6, 7, 8], [3, 4, 5], [0, 1, 2]], ignore_threshold=0.7, nms_score_threshold=0.01, nms_topk=1000, nms_keep_topk=100, nms_iou_threshold=0.45, label_smooth=False)
														
@@ -291,7 +318,7 @@ paddlex.det.YOLOv3(num_classes=80, backbone='MobileNetV1', anchors=[[10, 13], [1
 
															 > - quant_aware_train 在线量化接口说明同 [PPYOLOv2模型quant_aware_train接口](#quant_aware_train)
														
 
															-## <h2 id="5">paddlex.det.FasterRCNN</h2>
														
 
															+## <h2 id="6">paddlex.det.FasterRCNN</h2>
														
 
															 ```python
														
 
															 paddlex.det.FasterRCNN(num_classes=80, backbone='ResNet50', with_fpn=True, aspect_ratios=[0.5, 1.0, 2.0], anchor_sizes=[[32], [64], [128], [256], [512]], keep_top_k=100, nms_threshold=0.5, score_threshold=0.05, fpn_num_channels=256, rpn_batch_size_per_im=256, rpn_fg_fraction=0.5, test_pre_nms_top_n=None, test_post_nms_top_n=1000)
														
--- a/docs/apis/prediction.md
+++ b/docs/apis/prediction.md
@@ -21,7 +21,7 @@ Predict Result: [{'category_id': 549, 'category': 'envelope', 'score': 0.2906293
 
															 ![](images/test.jpg)
														
 
															-- 分类模型predict接口[说明文档](./apis/models/classification.md#predict)
														
 
															+- 分类模型predict接口[说明文档](./models/classification.md#predict)
														
 
															 ## 目标检测
														
--- a/docs/apis/visualize.md
+++ b/docs/apis/visualize.md
@@ -96,7 +96,7 @@ paddlex.det.coco_error_analysis(eval_details_file=None, gt=None, pred_bbox=None,
 
															 ![](images/detection_analysis.jpg)
														
 
															-左图显示的是`person`类的分析结果，有图显示的是所有类别整体的分析结果。
														
 
															+左图显示的是`person`类的分析结果，右图显示的是所有类别整体的分析结果。
														
 
															 分析图表展示了7条Precision-Recall（PR）曲线，每一条曲线表示的Average Precision （AP）比它左边那条高，原因是逐步放宽了评估要求。以`person`类为例，各条PR曲线的评估要求解释如下：
														
--- a/docs/data/annotation/classification.md
+++ b/docs/data/annotation/classification.md
@@ -1,4 +1,4 @@
 
															-# 图像分数据标注
														
 
															+# 图像分类数据标注
														
 
															 图像分类标注是一项最基础，最简单的标注任务，图像分类无需标注工具，只需将属于同一类的图片放在同一个文件夹下即可，例如下所示目录结构，
														
 
															 ```
														
--- a/docs/data/format/detection.md
+++ b/docs/data/format/detection.md
@@ -6,6 +6,7 @@
 
															   * [数据文件夹结构](#11)
														
 
															   * [训练集、验证集列表和类别标签列表](#12)
														
 
															 * [数据加载](#2)
														
 
															+* [添加负样本](#3)
														
 
															 ## <h2 id="1">数据格式</h2>
														
@@ -97,5 +98,44 @@ eval_dataset = pdx.datasets.VOCDetection(
 
															                         file_list='./MyDataset/val_list.txt',
														
 
															                         label_list='MyDataset/labels.txt',
														
 
															                         transforms=eval_transforms)
														
 
															+```
														
 
															+
														
 
															+## <h2 id="3">添加负样本</h2>
														
 
															+
														
 
															+检测任务支持添加负样本进行训练以降低误检率，代码示例如下：
														
 
															+
														
 
															+```python
														
 
															+import paddlex as pdx
														
 
															+from paddlex import transforms as T
														
 
															+
														
 
															+train_transforms = T.Compose([
														
 
															+    T.RandomResizeByShort(
														
 
															+        short_sizes=[640, 672, 704, 736, 768, 800],
														
 
															+        max_size=1333,
														
 
															+        interp='CUBIC'),
														
 
															+    T.RandomHorizontalFlip(),
														
 
															+    T.Normalize(
														
 
															+            mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
														
 
															+])
														
 
															+
														
 
															+# 情况一：train_list中已经包含负样本
														
 
															+train_dataset = pdx.datasets.VOCDetection(
														
 
															+                        data_dir='./MyDataset',
														
 
															+                        file_list='./MyDataset/train_list.txt',
														
 
															+                        label_list='./MyDataset/labels.txt',
														
 
															+                        transforms=train_transforms,
														
 
															+                        allow_empty=True,   # 是否加载负样本
														
 
															+                        empty_ratio=1.)   # 用于指定负样本占总样本数的比例。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															+
														
 
															+# 情况二：train_list中仅包含正样本，负样本在单独的路径下
														
 
															+train_dataset = pdx.datasets.VOCDetection(
														
 
															+                        data_dir='./MyDataset',
														
 
															+                        file_list='./MyDataset/train_list.txt',
														
 
															+                        label_list='./MyDataset/labels.txt',
														
 
															+                        transforms=train_transforms)
														
 
															+train_dataset.add_negative_samples(
														
 
															+                        image_dir='path/to/negative/images',   # 背景图片所在的文件夹目录。
														
 
															+                        empty_ratio=1)   # 用于指定负样本占总样本数的比例。如果为None，保留数据集初始化时设置的`empty_ratio`值，
														
 
															+                                         # 否则更新原有`empty_ratio`值。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															 ```
														
--- a/docs/data/format/instance_segmentation.md
+++ b/docs/data/format/instance_segmentation.md
@@ -6,6 +6,7 @@
 
															   * [数据文件夹结构](#11)
														
 
															   * [训练集、验证集列表](#12)
														
 
															 * [数据加载](#2)
														
 
															+* [添加负样本](#3)
														
 
															 ## <h2 id="1">数据格式</h2>
														
@@ -65,3 +66,42 @@ eval_dataset = pdx.dataset.CocoDetection(
 
															                     ann_file='./MyDataset/val.json',
														
 
															                     transforms=eval_transforms)
														
 
															 ```
														
 
															+
														
 
															+
														
 
															+## <h2 id="3">添加负样本</h2>
														
 
															+
														
 
															+实例分割任务支持添加负样本进行训练以降低误检率，代码示例如下：
														
 
															+
														
 
															+```python
														
 
															+import paddlex as pdx
														
 
															+from paddlex import transforms as T
														
 
															+
														
 
															+train_transforms = T.Compose([
														
 
															+    T.RandomResizeByShort(
														
 
															+        short_sizes=[640, 672, 704, 736, 768, 800],
														
 
															+        max_size=1333,
														
 
															+        interp='CUBIC'),
														
 
															+    T.RandomHorizontalFlip(),
														
 
															+    T.Normalize(
														
 
															+            mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
														
 
															+])
														
 
															+
														
 
															+# 情况一：ann_file中已经包含负样本
														
 
															+train_dataset = pdx.dataset.CocoDetection(
														
 
															+                    data_dir='./MyDataset/JPEGImages',
														
 
															+                    ann_file='./MyDataset/train.json',
														
 
															+                    transforms=train_transforms,
														
 
															+                    allow_empty=True,   # 是否加载负样本
														
 
															+                    empty_ratio=1.)   # 用于指定负样本占总样本数的比例。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															+
														
 
															+# 情况二：ann_file中仅包含正样本，负样本在单独的路径下
														
 
															+train_dataset = pdx.dataset.CocoDetection(
														
 
															+                    data_dir='./MyDataset/JPEGImages',
														
 
															+                    ann_file='./MyDataset/train.json',
														
 
															+                    transforms=train_transforms)
														
 
															+train_dataset.add_negative_samples(
														
 
															+                        image_dir='path/to/negative/images',   # 背景图片所在的文件夹目录。
														
 
															+                        empty_ratio=1)   # 用于指定负样本占总样本数的比例。如果为None，保留数据集初始化时设置的`empty_ratio`值，
														
 
															+                                         # 否则更新原有`empty_ratio`值。如果小于0或大于等于1，则保留全部的负样本。默认为1。
														
 
															+
														
 
															+```
														
--- a/docs/gui/README.md
+++ b/docs/gui/README.md
@@ -17,4 +17,4 @@ PaddleX可视化客户端是PaddleX API的衍生品，它在集成API功能的
 
															 ## 安装使用
														
 
															 - 请参考[安装方式文档](./download.md)下载安装PaddleX可视化客户端。
														
 
															-- 请参考[快速开始](./quick_start.md)查看[视频教程](./quick_start.md/#视频教程)和[文档教程](./quick_start.md/#文档教程)。
														
 
															+- 请参考[快速开始](../quick_start_GUI.md)查看[视频教程](../quick_start_GUI.md#视频教程)和[文档教程](../quick_start_GUI.md#文档教程)。
														
--- a/docs/gui/first_meet.md
+++ b/docs/gui/first_meet.md
@@ -0,0 +1,20 @@
 
															+# PaddleX可视化客户端介绍
														
 
															+
														
 
															+PaddleX可视化客户端是基于PaddleX开发的可视化深度学习模型训练套件，目前支持训练视觉领域的图像分类、目标检测、实例分割和语义分割四大任务。开发者以点选、键入的方式快速体验深度学习模型开发的全流程。可以作为您提升深度学习模型开发效率的工具。
														
 
															+
														
 
															+PaddleX GUI 当前提供Windows，Mac，Ubuntu三种版本一键绿色安装的方式。请至飞桨官网：https://www.paddlepaddle.org.cn/paddle/paddleX 下载您需要的版本。
														
 
															+
														
 
															+## 功能
														
 
															+PaddleX可视化客户端是PaddleX API的衍生品，它在集成API功能的基础上，额外提供了可视化分析、评估等附加功能，致力于为开发者带来极致顺畅的开发体验。其拥有以下独特的功能：
														
 
															+- **全流程打通**：PaddleX GUI覆盖深度学习模型开发必经的 **数据处理** 、 **超参配置** 、 **模型训练及优化** 、 **模型发布** 全流程，无需开发一行代码，即可得到高性能深度学习推理模型。
														
 
															+- **数据集智能分析**：详细的数据结构说明，并提供 **数据标签自动校验** 。支持 **可视化数据预览** 、 **数据分布图表展示** 、 **一键数据集切分** 等实用功能
														
 
															+- **自动超参推荐**：集成飞桨团队长时间产业实践经验，根据用户选择的模型类别、骨架网络等，提供多种针对性优化的 **预训练模型** ，并 **提供推荐超参配置** ，可 **一键开启多种优化策略**
														
 
															+- **可视化模型评估**：集成 **可视化分析工具：VisualDL** , 以线性图表的形式展示精度、学习率等关键参数在训练过程中的变化趋势。提供 **混淆矩阵** 等实用方法，帮助快速定位问题，加速调参。模型评估报告一键导出，方便项目复盘分析。
														
 
															+- **模型裁剪及量化**：一键启动模型裁剪、量化，在不同阶段为开发者提供模型优化的策略，满足不同环境对模型性能的需求。
														
 
															+- **预训练模型管理**：可对历史训练模型进行保存及管理，未进行裁剪的模型可以保存为预训练模型，在后续任务中使用。
														
 
															+- **可视化模型测试**：客户端直接展示模型预测效果，无需上线即可进行效果评估
														
 
															+- **模型多端部署**：点选式选择模型发布平台、格式，一键导出预测模型，并匹配完善的模型预测部署说明文档，贴心助力产业端到端项目落地
														
 
															+
														
 
															+## 安装使用
														
 
															+- 请参考[安装方式文档](./download.md)下载安装PaddleX可视化客户端。
														
 
															+- 请参考[快速开始](../quick_start_GUI.md)查看[视频教程](../quick_start_GUI.md#视频教程)和[文档教程](../quick_start_GUI.md#文档教程)。
														
--- a/docs/quick_start_API.md
+++ b/docs/quick_start_API.md
@@ -3,7 +3,7 @@
 
															 ## 目录
														
 
															 - [快速安装](#快速安装)
														
 
															-    - [PaddleX 2.0.0安装](#PaddleX-200安装)
														
 
															+    - [PaddleX 2.1.0安装](#PaddleX-210安装)
														
 
															     - [PaddleX develop安装](#PaddleX-develop安装)
														
 
															 - [使用前置说明](#使用前置说明)
														
 
															     - [PaddleX的模型训练](#PaddleX的模型训练)
														
@@ -18,17 +18,17 @@
 
															     - <a href=#加载训练保存的模型预测>加载训练保存的模型预测</a>
														
 
															 ## 快速安装
														
 
															-以下安装过程默认用户已安装好**paddlepaddle-gpu或paddlepaddle(版本大于或等于2.1.2)**，paddlepaddle安装方式参照[飞桨官网](https://www.paddlepaddle.org.cn/install/quick?docurl=/documentation/docs/zh/release/2.0.0/install/pip/windows-pip.html)
														
 
															+以下安装过程默认用户已安装好**paddlepaddle-gpu或paddlepaddle(版本大于或等于2.2.0)**，paddlepaddle安装方式参照[飞桨官网](https://www.paddlepaddle.org.cn/install/quick?docurl=/documentation/docs/zh/release/2.0.0/install/pip/windows-pip.html)
														
 
															-### PaddleX 2.0.0安装
														
 
															+### PaddleX 2.1.0安装
														
 
															 **我们推荐大家先安装Anaconda，而后在新建的conda环境中使用上述pip安装方式**。Anaconda是一个开源的Python发行版本，其包含了conda、Python等180多个科学包及其依赖项。使用Anaconda可以通过创建多个独立的Python环境，避免用户的Python环境安装太多不同版本依赖导致冲突。参考[Anaconda安装PaddleX文档](./appendix/anaconda_install.md)
														
 
															 - Linux / macOS 操作系统
														
 
															-使用pip安装方式安装2.0.0版本：
														
 
															+使用pip安装方式安装2.1.0版本：
														
 
															 ```commandline
														
 
															-pip install paddlex==2.0.0 -i https://mirror.baidu.com/pypi/simple
														
 
															+pip install paddlex==2.1.0 -i https://mirror.baidu.com/pypi/simple
														
 
															 ```
														
 
															 paddlepaddle已集成pycocotools包，但也有pycocotools无法随paddlepaddle成功安装的情况。因PaddleX依赖pycocotools包，如遇到pycocotools安装失败，可参照如下方式安装pycocotools：
														
@@ -39,10 +39,10 @@ pip install pycocotools
 
															 ```
														
 
															 - Windows 操作系统
														
 
															-使用pip安装方式安装2.0.0版本：
														
 
															+使用pip安装方式安装2.1.0版本：
														
 
															 ```commandline
														
 
															-pip install paddlex==2.0.0 -i https://mirror.baidu.com/pypi/simple
														
 
															+pip install paddlex==2.1.0 -i https://mirror.baidu.com/pypi/simple
														
 
															 ```
														
 
															 因PaddleX依赖pycocotools包，Windows安装时可能会提示`Microsoft Visual C++ 14.0 is required`，从而导致安装出错，[点击下载VC build tools](https://go.microsoft.com/fwlink/?LinkId=691126)安装再执行如下pip命令
														
@@ -65,7 +65,7 @@ pip install -r requirements.txt
 
															 python setup.py install
														
 
															 ```
														
 
															-如遇到pycocotools安装失败，参考[PaddleX 2.0.0安装](./install.md#paddlex-200安装)中介绍的解决方法。
														
 
															+如遇到pycocotools安装失败，参考[PaddleX 2.1.0安装](./install.md#paddlex-210安装)中介绍的解决方法。
														
 
															 ## 使用前置说明
														
--- a/docs/quick_start_GUI.md
+++ b/docs/quick_start_GUI.md
@@ -18,8 +18,8 @@
 
															 ## 快速安装
														
 
															 ### 下载安装
														
 
															 下载地址：https://www.paddlepaddle.org.cn/paddlex
														
 
															-目前最新版本的GUI(Version 2.0.0)仅提供WIN和Linux版，暂未提供Mac版，若需在Mac上使用GUI，推荐安装Mac版历史版本Version 1.1.7
														
 
															-- 特别说明：GUI 2.0要求CUDA >=11.0, cuDNN >= 8.0
														
 
															+目前最新版本的GUI(Version 2.1.0)仅提供WIN和Linux版，暂未提供Mac版，若需在Mac上使用GUI，推荐安装Mac版历史版本Version 1.1.7
														
 
															+- 特别说明：GUI 2.1要求CUDA >=11.0, cuDNN >= 8.0
														
 
															 - WIN版下载后双击选择安装路径即可
														
 
															 - Mac/Linux版下载后解压即可
														
--- a/paddlex/__init__.py
+++ b/paddlex/__init__.py
@@ -12,7 +12,7 @@
 
															 # See the License for the specific language governing permissions and
														
 
															 # limitations under the License.
														
 
															-__version__ = '2.0.0'
														
 
															+__version__ = '2.1.0'
														
 
															 from paddlex.utils.env import get_environ_info, init_parallel_env
														
 
															 init_parallel_env()
														
--- a/paddlex/cls.py
+++ b/paddlex/cls.py
@@ -77,3 +77,6 @@ Xception71 = cv.models.Xception71
 
															 ShuffleNetV2 = cv.models.ShuffleNetV2
														
 
															 ShuffleNetV2_swish = cv.models.ShuffleNetV2_swish
														
 
															+
														
 
															+PPLCNet = cv.models.PPLCNet
														
 
															+PPLCNet_ssld = cv.models.PPLCNet_ssld
														
--- a/paddlex/cv/datasets/voc.py
+++ b/paddlex/cv/datasets/voc.py
@@ -217,8 +217,8 @@ class VOCDetection(Dataset):
 
															                     if not (x2 >= x1 and y2 >= y1):
														
 
															                         logging.warning(
														
 
															-                            "Bounding box for object {} does not satisfy x1 <= x2 and y1 <= y2, "
														
 
															-                            "so this object is skipped".format(i))
														
 
															+                            "Bounding box for object {} does not satisfy xmin {} <= xmax {} and ymin {} <= ymax {}, "
														
 
															+                            "so this object is skipped. xml file: {}".format(i, x1, x2, y1, y2, xml_file))
														
 
															                         continue
														
 
															                     gt_bbox[i, :] = [x1, y1, x2, y2]
														
--- a/paddlex/cv/models/base.py
+++ b/paddlex/cv/models/base.py
@@ -48,6 +48,8 @@ class BaseModel:
 
															         self.train_data_loader = None
														
 
															         self.eval_data_loader = None
														
 
															         self.eval_metrics = None
														
 
															+        self.best_accuracy = -1.
														
 
															+        self.best_model_epoch = -1
														
 
															         # 是否使用多卡间同步BatchNorm均值和方差
														
 
															         self.sync_bn = False
														
 
															         self.status = 'Normal'
														
@@ -115,6 +117,8 @@ class BaseModel:
 
															             with open(osp.join(resume_checkpoint, "model.yml")) as f:
														
 
															                 info = yaml.load(f.read(), Loader=yaml.Loader)
														
 
															                 self.completed_epochs = info['completed_epochs']
														
 
															+                self.best_accuracy = info['_Attributes']['best_accuracy']
														
 
															+                self.best_model_epoch = info['_Attributes']['best_model_epoch']
														
 
															             load_checkpoint(
														
 
															                 self.net,
														
 
															                 self.optimizer,
														
@@ -125,7 +129,12 @@ class BaseModel:
 
															         info = dict()
														
 
															         info['version'] = paddlex.__version__
														
 
															         info['Model'] = self.__class__.__name__
														
 
															-        info['_Attributes'] = {'model_type': self.model_type}
														
 
															+        info['_Attributes'] = dict(
														
 
															+            [('model_type', self.model_type),
														
 
															+             ('num_classes', self.num_classes), ('labels', self.labels),
														
 
															+             ('fixed_input_shape', self.fixed_input_shape),
														
 
															+             ('best_accuracy', self.best_accuracy),
														
 
															+             ('best_model_epoch', self.best_model_epoch)])
														
 
															         if 'self' in self.init_params:
														
 
															             del self.init_params['self']
														
 
															         if '__class__' in self.init_params:
														
@@ -137,10 +146,6 @@ class BaseModel:
 
															         info['_init_params'] = self.init_params
														
 
															-        info['_Attributes']['num_classes'] = self.num_classes
														
 
															-        info['_Attributes']['labels'] = self.labels
														
 
															-        info['_Attributes']['fixed_input_shape'] = self.fixed_input_shape
														
 
															-
														
 
															         try:
														
 
															             primary_metric_key = list(self.eval_metrics.keys())[0]
														
 
															             primary_metric_value = float(self.eval_metrics[primary_metric_key])
														
@@ -317,9 +322,6 @@ class BaseModel:
 
															             eval_batch_size = train_batch_size
														
 
															             eval_epoch_time = 0
														
 
															-        best_accuracy_key = ""
														
 
															-        best_accuracy = -1.0
														
 
															-        best_model_epoch = -1
														
 
															         current_step = 0
														
 
															         for i in range(start_epoch, num_epochs):
														
 
															             self.net.train()
														
@@ -384,11 +386,12 @@ class BaseModel:
 
															                          .format(i + 1, train_avg_metrics.log()))
														
 
															             self.completed_epochs += 1
														
 
															-            # 每间隔save_interval_epochs, 在验证集上评估和对模型进行保存
														
 
															             if ema is not None:
														
 
															                 weight = copy.deepcopy(self.net.state_dict())
														
 
															                 self.net.set_state_dict(ema.apply())
														
 
															             eval_epoch_tic = time.time()
														
 
															+
														
 
															+            # 每间隔save_interval_epochs, 在验证集上评估和对模型进行保存
														
 
															             if (i + 1) % save_interval_epochs == 0 or i == num_epochs - 1:
														
 
															                 if eval_dataset is not None and eval_dataset.num_samples > 0:
														
 
															                     eval_result = self.evaluate(
														
@@ -410,16 +413,16 @@ class BaseModel:
 
															                             i + 1, dict2str(self.eval_metrics)))
														
 
															                         best_accuracy_key = list(self.eval_metrics.keys())[0]
														
 
															                         current_accuracy = self.eval_metrics[best_accuracy_key]
														
 
															-                        if current_accuracy > best_accuracy:
														
 
															-                            best_accuracy = current_accuracy
														
 
															-                            best_model_epoch = i + 1
														
 
															+                        if current_accuracy > self.best_accuracy:
														
 
															+                            self.best_accuracy = current_accuracy
														
 
															+                            self.best_model_epoch = i + 1
														
 
															                             best_model_dir = osp.join(save_dir, "best_model")
														
 
															                             self.save_model(save_dir=best_model_dir)
														
 
															-                        if best_model_epoch > 0:
														
 
															+                        if self.best_model_epoch > 0:
														
 
															                             logging.info(
														
 
															                                 'Current evaluated best model on eval_dataset is epoch_{}, {}={}'
														
 
															-                                .format(best_model_epoch, best_accuracy_key,
														
 
															-                                        best_accuracy))
														
 
															+                                .format(self.best_model_epoch,
														
 
															+                                        best_accuracy_key, self.best_accuracy))
														
 
															                     eval_epoch_time = time.time() - eval_epoch_tic
														
 
															                 current_save_dir = osp.join(save_dir, "epoch_{}".format(i + 1))
														
@@ -444,11 +447,11 @@ class BaseModel:
 
															             criterion({'l1_norm', 'fpgm'}, optional): Pruning criterion. Defaults to 'l1_norm'.
														
 
															             save_dir(str, optional): The directory to save sensitivity file of the model. Defaults to 'output'.
														
 
															         """
														
 
															-        if self.__class__.__name__ in ['FasterRCNN', 'MaskRCNN']:
														
 
															+        if self.__class__.__name__ in {'FasterRCNN', 'MaskRCNN', 'PicoDet'}:
														
 
															             raise Exception("{} does not support pruning currently!".format(
														
 
															                 self.__class__.__name__))
														
 
															-        assert criterion in ['l1_norm', 'fpgm'], \
														
 
															+        assert criterion in {'l1_norm', 'fpgm'}, \
														
 
															             "Pruning criterion {} is not supported. Please choose from ['l1_norm', 'fpgm']"
														
 
															         arrange_transforms(
														
 
															             model_type=self.model_type,
														
--- a/paddlex/cv/models/classifier.py
+++ b/paddlex/cv/models/classifier.py
@@ -37,7 +37,7 @@ __all__ = [
 
															     "DenseNet121", "DenseNet161", "DenseNet169", "DenseNet201", "DenseNet264",
														
 
															     "HRNet_W18_C", "HRNet_W30_C", "HRNet_W32_C", "HRNet_W40_C", "HRNet_W44_C",
														
 
															     "HRNet_W48_C", "HRNet_W64_C", "Xception41", "Xception65", "Xception71",
														
 
															-    "ShuffleNetV2", "ShuffleNetV2_swish"
														
 
															+    "ShuffleNetV2", "ShuffleNetV2_swish", "PPLCNet", "PPLCNet_ssld"
														
 
															 ]
														
@@ -152,58 +152,59 @@ class BaseClassifier(BaseModel):
 
															                           lr_decay_epochs,
														
 
															                           lr_decay_gamma,
														
 
															                           num_steps_each_epoch,
														
 
															-                          decay_coff=1e-04,
														
 
															-                          lr_method='Linear',
														
 
															+                          reg_coeff=1e-04,
														
 
															+                          scheduler='Piecewise',
														
 
															                           num_epochs=None):
														
 
															-        if warmup_steps > 0:
														
 
															-            if lr_method == 'Linear':
														
 
															-                if warmup_steps > lr_decay_epochs[0] * num_steps_each_epoch:
														
 
															-                    logging.error(
														
 
															-                        "In function train(), parameters should satisfy: "
														
 
															-                        "warmup_steps <= lr_decay_epochs[0]*num_samples_in_train_dataset.",
														
 
															-                        exit=False)
														
 
															-                    logging.error(
														
 
															-                        "See this doc for more information: "
														
 
															-                        "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															-                        exit=False)
														
 
															-                    logging.error(
														
 
															-                        "warmup_steps should be less than {} or lr_decay_epochs[0] greater than {}, "
														
 
															-                        "please modify 'lr_decay_epochs' or 'warmup_steps' in train function".
														
 
															-                        format(lr_decay_epochs[0] * num_steps_each_epoch,
														
 
															-                               warmup_steps // num_steps_each_epoch))
														
 
															-            elif lr_method == 'Cosine':
														
 
															-                if num_epochs is None:
														
 
															-                    logging.error(
														
 
															-                        "num_epochs must be set when using cosine learning rate method, but received is {}".
														
 
															-                        format(num_epochs),
														
 
															-                        exit=False)
														
 
															-                if warmup_steps > num_epochs * num_steps_each_epoch:
														
 
															-                    logging.error(
														
 
															-                        "In function train(), parameters should satisfy: "
														
 
															-                        "warmup_steps <= num_epochs*num_samples_in_train_dataset.",
														
 
															-                        exit=False)
														
 
															-                    logging.error(
														
 
															-                        "See this doc for more information: "
														
 
															-                        "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															-                        exit=False)
														
 
															-                    logging.error(
														
 
															-                        "warmup_steps should be less than {}, "
														
 
															-                        "please modify 'num_epochs' or 'warmup_steps' in train function".
														
 
															-                        format(num_epochs * num_steps_each_epoch))
														
 
															-        if lr_method == 'Linear':
														
 
															+        if scheduler.lower() == 'piecewise':
														
 
															+            if warmup_steps > 0 and warmup_steps > lr_decay_epochs[
														
 
															+                    0] * num_steps_each_epoch:
														
 
															+                logging.error(
														
 
															+                    "In function train(), parameters must satisfy: "
														
 
															+                    "warmup_steps <= lr_decay_epochs[0] * num_samples_in_train_dataset. "
														
 
															+                    "See this doc for more information: "
														
 
															+                    "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															+                    exit=False)
														
 
															+                logging.error(
														
 
															+                    "Either `warmup_steps` be less than {} or lr_decay_epochs[0] be greater than {} "
														
 
															+                    "must be satisfied, please modify 'warmup_steps' or 'lr_decay_epochs' in train function".
														
 
															+                    format(lr_decay_epochs[0] * num_steps_each_epoch,
														
 
															+                           warmup_steps // num_steps_each_epoch),
														
 
															+                    exit=True)
														
 
															             boundaries = [b * num_steps_each_epoch for b in lr_decay_epochs]
														
 
															             values = [
														
 
															                 learning_rate * (lr_decay_gamma**i)
														
 
															                 for i in range(len(lr_decay_epochs) + 1)
														
 
															             ]
														
 
															             scheduler = paddle.optimizer.lr.PiecewiseDecay(boundaries, values)
														
 
															-        elif lr_method == 'Cosine':
														
 
															+        elif scheduler.lower() == 'cosine':
														
 
															+            if num_epochs is None:
														
 
															+                logging.error(
														
 
															+                    "`num_epochs` must be set while using cosine annealing decay scheduler, but received {}".
														
 
															+                    format(num_epochs),
														
 
															+                    exit=False)
														
 
															+            if warmup_steps > 0 and warmup_steps > num_epochs * num_steps_each_epoch:
														
 
															+                logging.error(
														
 
															+                    "In function train(), parameters must satisfy: "
														
 
															+                    "warmup_steps <= num_epochs * num_samples_in_train_dataset. "
														
 
															+                    "See this doc for more information: "
														
 
															+                    "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															+                    exit=False)
														
 
															+                logging.error(
														
 
															+                    "`warmup_steps` must be less than the total number of steps({}), "
														
 
															+                    "please modify 'num_epochs' or 'warmup_steps' in train function".
														
 
															+                    format(num_epochs * num_steps_each_epoch),
														
 
															+                    exit=True)
														
 
															             T_max = num_epochs * num_steps_each_epoch - warmup_steps
														
 
															-            scheduler = paddle.lr.CosineAnnealingDecay(
														
 
															+            scheduler = paddle.optimizer.lr.CosineAnnealingDecay(
														
 
															                 learning_rate=learning_rate,
														
 
															                 T_max=T_max,
														
 
															                 eta_min=0.0,
														
 
															                 last_epoch=-1)
														
 
															+        else:
														
 
															+            logging.error(
														
 
															+                "Invalid learning rate scheduler: {}!".format(scheduler),
														
 
															+                exit=True)
														
 
															+
														
 
															         if warmup_steps > 0:
														
 
															             scheduler = paddle.optimizer.lr.LinearWarmup(
														
 
															                 learning_rate=scheduler,
														
@@ -214,7 +215,7 @@ class BaseClassifier(BaseModel):
 
															         optimizer = paddle.optimizer.Momentum(
														
 
															             scheduler,
														
 
															             momentum=.9,
														
 
															-            weight_decay=paddle.regularizer.L2Decay(coeff=decay_coff),
														
 
															+            weight_decay=paddle.regularizer.L2Decay(coeff=reg_coeff),
														
 
															             parameters=parameters)
														
 
															         return optimizer
														
@@ -873,3 +874,116 @@ class ShuffleNetV2_swish(BaseClassifier):
 
															                 shape=image_shape, name='image', dtype='float32')
														
 
															         ]
														
 
															         return input_spec
														
 
															+
														
 
															+
														
 
															+class PPLCNet(BaseClassifier):
														
 
															+    def __init__(self, num_classes=1000, scale=1., **params):
														
 
															+        supported_scale = [.25, .35, .5, .75, 1., 1.5, 2., 2.5]
														
 
															+        if scale not in supported_scale:
														
 
															+            logging.warning("scale={} is not supported by PPLCNet, "
														
 
															+                            "scale is forcibly set to 1.0".format(scale))
														
 
															+            scale = 1.0
														
 
															+        model_name = 'PPLCNet_x' + str(float(scale)).replace('.', '_')
														
 
															+        super(PPLCNet, self).__init__(
														
 
															+            model_name=model_name, num_classes=num_classes, **params)
														
 
															+
														
 
															+    def train(self,
														
 
															+              num_epochs,
														
 
															+              train_dataset,
														
 
															+              train_batch_size=64,
														
 
															+              eval_dataset=None,
														
 
															+              optimizer=None,
														
 
															+              save_interval_epochs=1,
														
 
															+              log_interval_steps=10,
														
 
															+              save_dir='output',
														
 
															+              pretrain_weights='IMAGENET',
														
 
															+              learning_rate=.1,
														
 
															+              warmup_steps=0,
														
 
															+              warmup_start_lr=0.0,
														
 
															+              lr_decay_epochs=(30, 60, 90),
														
 
															+              lr_decay_gamma=0.1,
														
 
															+              label_smoothing=None,
														
 
															+              early_stop=False,
														
 
															+              early_stop_patience=5,
														
 
															+              use_vdl=True,
														
 
															+              resume_checkpoint=None):
														
 
															+        """
														
 
															+        Train the model.
														
 
															+        Args:
														
 
															+            num_epochs(int): The number of epochs.
														
 
															+            train_dataset(paddlex.dataset): Training dataset.
														
 
															+            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
														
 
															+            eval_dataset(paddlex.dataset, optional):
														
 
															+                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
														
 
															+            optimizer(paddle.optimizer.Optimizer or None, optional):
														
 
															+                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
														
 
															+            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
														
 
															+            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
														
 
															+            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
														
 
															+            pretrain_weights(str or None, optional):
														
 
															+                None or name/path of pretrained weights. If None, no pretrained weights will be loaded.
														
 
															+                At most one of `resume_checkpoint` and `pretrain_weights` can be set simultaneously.
														
 
															+                Defaults to 'IMAGENET'.
														
 
															+            learning_rate(float, optional): Learning rate for training. Defaults to .1.
														
 
															+            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
														
 
															+            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0.0.
														
 
															+            lr_decay_epochs(List[int] or Tuple[int], optional):
														
 
															+                Epoch milestones for learning rate decay. Defaults to (30, 60, 90).
														
 
															+            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
														
 
															+            label_smoothing(float, bool or None, optional): Whether to adopt label smoothing or not.
														
 
															+                If float, the value is the epsilon coefficient of label smoothing. If False or None, label smoothing
														
 
															+                will not be adopted. Otherwise, label smoothing is adopted with epsilon equal to 0.1. Defaults to None.
														
 
															+            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
														
 
															+            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
														
 
															+            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
														
 
															+            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
														
 
															+                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
														
 
															+                `pretrain_weights` can be set simultaneously. Defaults to None.
														
 
															+
														
 
															+        """
														
 
															+        if optimizer is None:
														
 
															+            num_steps_each_epoch = len(train_dataset) // train_batch_size
														
 
															+            optimizer = self.default_optimizer(
														
 
															+                parameters=self.net.parameters(),
														
 
															+                learning_rate=learning_rate,
														
 
															+                warmup_steps=warmup_steps,
														
 
															+                warmup_start_lr=warmup_start_lr,
														
 
															+                lr_decay_epochs=lr_decay_epochs,
														
 
															+                lr_decay_gamma=lr_decay_gamma,
														
 
															+                num_steps_each_epoch=num_steps_each_epoch,
														
 
															+                reg_coeff=3e-5,
														
 
															+                scheduler='Cosine',
														
 
															+                num_epochs=num_epochs)
														
 
															+        super(PPLCNet, self).train(
														
 
															+            num_epochs=num_epochs,
														
 
															+            train_dataset=train_dataset,
														
 
															+            train_batch_size=train_batch_size,
														
 
															+            eval_dataset=eval_dataset,
														
 
															+            optimizer=optimizer,
														
 
															+            save_interval_epochs=save_interval_epochs,
														
 
															+            log_interval_steps=log_interval_steps,
														
 
															+            save_dir=save_dir,
														
 
															+            pretrain_weights=pretrain_weights,
														
 
															+            learning_rate=learning_rate,
														
 
															+            warmup_steps=warmup_steps,
														
 
															+            warmup_start_lr=warmup_start_lr,
														
 
															+            lr_decay_epochs=lr_decay_epochs,
														
 
															+            lr_decay_gamma=lr_decay_gamma,
														
 
															+            label_smoothing=label_smoothing,
														
 
															+            early_stop=early_stop,
														
 
															+            early_stop_patience=early_stop_patience,
														
 
															+            use_vdl=use_vdl,
														
 
															+            resume_checkpoint=resume_checkpoint)
														
 
															+
														
 
															+
														
 
															+class PPLCNet_ssld(PPLCNet):
														
 
															+    def __init__(self, num_classes=1000, scale=1., **params):
														
 
															+        supported_scale = [.5, 1., 2.5]
														
 
															+        if scale not in supported_scale:
														
 
															+            logging.warning("scale={} is not supported by PPLCNet, "
														
 
															+                            "scale is forcibly set to 1.0".format(scale))
														
 
															+            scale = 1.0
														
 
															+        model_name = 'PPLCNet_x' + str(float(scale)).replace('.', '_')
														
 
															+        super(PPLCNet, self).__init__(
														
 
															+            model_name=model_name, num_classes=num_classes, **params)
														
 
															+        self.model_name = model_name + '_ssld'
														
--- a/paddlex/cv/models/detector.py
+++ b/paddlex/cv/models/detector.py
@@ -31,7 +31,7 @@ from paddlex.cv.transforms.batch_operators import BatchCompose, BatchRandomResiz
 
															 from paddlex.cv.transforms import arrange_transforms
														
 
															 from .base import BaseModel
														
 
															 from .utils.det_metrics import VOCMetric, COCOMetric
														
 
															-from .utils.ema import ExponentialMovingAverage
														
 
															+from paddlex.ppdet.optimizer import ModelEMA
														
 
															 from paddlex.utils.checkpoint import det_pretrain_weights_dict
														
 
															 __all__ = [
														
@@ -112,25 +112,66 @@ class BaseDetector(BaseModel):
 
															         return outputs
														
 
															-    def default_optimizer(self, parameters, learning_rate, warmup_steps,
														
 
															-                          warmup_start_lr, lr_decay_epochs, lr_decay_gamma,
														
 
															-                          num_steps_each_epoch):
														
 
															-        boundaries = [b * num_steps_each_epoch for b in lr_decay_epochs]
														
 
															-        values = [(lr_decay_gamma**i) * learning_rate
														
 
															-                  for i in range(len(lr_decay_epochs) + 1)]
														
 
															-        scheduler = paddle.optimizer.lr.PiecewiseDecay(
														
 
															-            boundaries=boundaries, values=values)
														
 
															-        if warmup_steps > 0:
														
 
															-            if warmup_steps > lr_decay_epochs[0] * num_steps_each_epoch:
														
 
															+    def default_optimizer(self,
														
 
															+                          parameters,
														
 
															+                          learning_rate,
														
 
															+                          warmup_steps,
														
 
															+                          warmup_start_lr,
														
 
															+                          lr_decay_epochs,
														
 
															+                          lr_decay_gamma,
														
 
															+                          num_steps_each_epoch,
														
 
															+                          reg_coeff=1e-04,
														
 
															+                          scheduler='Piecewise',
														
 
															+                          num_epochs=None):
														
 
															+        if scheduler.lower() == 'piecewise':
														
 
															+            if warmup_steps > 0 and warmup_steps > lr_decay_epochs[
														
 
															+                    0] * num_steps_each_epoch:
														
 
															+                logging.error(
														
 
															+                    "In function train(), parameters must satisfy: "
														
 
															+                    "warmup_steps <= lr_decay_epochs[0] * num_samples_in_train_dataset. "
														
 
															+                    "See this doc for more information: "
														
 
															+                    "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															+                    exit=False)
														
 
															+                logging.error(
														
 
															+                    "Either `warmup_steps` be less than {} or lr_decay_epochs[0] be greater than {} "
														
 
															+                    "must be satisfied, please modify 'warmup_steps' or 'lr_decay_epochs' in train function".
														
 
															+                    format(lr_decay_epochs[0] * num_steps_each_epoch,
														
 
															+                           warmup_steps // num_steps_each_epoch),
														
 
															+                    exit=True)
														
 
															+            boundaries = [b * num_steps_each_epoch for b in lr_decay_epochs]
														
 
															+            values = [(lr_decay_gamma**i) * learning_rate
														
 
															+                      for i in range(len(lr_decay_epochs) + 1)]
														
 
															+            scheduler = paddle.optimizer.lr.PiecewiseDecay(boundaries, values)
														
 
															+        elif scheduler.lower() == 'cosine':
														
 
															+            if num_epochs is None:
														
 
															                 logging.error(
														
 
															-                    "In function train(), parameters should satisfy: "
														
 
															-                    "warmup_steps <= lr_decay_epochs[0]*num_samples_in_train_dataset",
														
 
															+                    "`num_epochs` must be set while using cosine annealing decay scheduler, but received {}".
														
 
															+                    format(num_epochs),
														
 
															                     exit=False)
														
 
															+            if warmup_steps > 0 and warmup_steps > num_epochs * num_steps_each_epoch:
														
 
															                 logging.error(
														
 
															+                    "In function train(), parameters must satisfy: "
														
 
															+                    "warmup_steps <= num_epochs * num_samples_in_train_dataset. "
														
 
															                     "See this doc for more information: "
														
 
															                     "https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md",
														
 
															                     exit=False)
														
 
															+                logging.error(
														
 
															+                    "`warmup_steps` must be less than the total number of steps({}), "
														
 
															+                    "please modify 'num_epochs' or 'warmup_steps' in train function".
														
 
															+                    format(num_epochs * num_steps_each_epoch),
														
 
															+                    exit=True)
														
 
															+            T_max = num_epochs * num_steps_each_epoch - warmup_steps
														
 
															+            scheduler = paddle.optimizer.lr.CosineAnnealingDecay(
														
 
															+                learning_rate=learning_rate,
														
 
															+                T_max=T_max,
														
 
															+                eta_min=0.0,
														
 
															+                last_epoch=-1)
														
 
															+        else:
														
 
															+            logging.error(
														
 
															+                "Invalid learning rate scheduler: {}!".format(scheduler),
														
 
															+                exit=True)
														
 
															+        if warmup_steps > 0:
														
 
															             scheduler = paddle.optimizer.lr.LinearWarmup(
														
 
															                 learning_rate=scheduler,
														
 
															                 warmup_steps=warmup_steps,
														
@@ -139,7 +180,7 @@ class BaseDetector(BaseModel):
 
															         optimizer = paddle.optimizer.Momentum(
														
 
															             scheduler,
														
 
															             momentum=.9,
														
 
															-            weight_decay=paddle.regularizer.L2Decay(coeff=1e-04),
														
 
															+            weight_decay=paddle.regularizer.L2Decay(coeff=reg_coeff),
														
 
															             parameters=parameters)
														
 
															         return optimizer
														
@@ -275,8 +316,7 @@ class BaseDetector(BaseModel):
 
															                                  'ESNet_' in self.backbone_name))
														
 
															         if use_ema:
														
 
															-            ema = ExponentialMovingAverage(
														
 
															-                decay=.9998, model=self.net, use_thres_step=True)
														
 
															+            ema = ModelEMA(model=self.net, decay=.9998, use_thres_step=True)
														
 
															         else:
														
 
															             ema = None
														
 
															         # start train loop
														
@@ -593,8 +633,8 @@ class PicoDet(BaseDetector):
 
															                  num_classes=80,
														
 
															                  backbone='ESNet_m',
														
 
															                  nms_score_threshold=.025,
														
 
															-                 nms_top_k=1000,
														
 
															-                 nms_keep_top_k=100,
														
 
															+                 nms_topk=1000,
														
 
															+                 nms_keep_topk=100,
														
 
															                  nms_iou_threshold=.6,
														
 
															                  **params):
														
 
															         self.init_params = locals()
														
@@ -691,8 +731,8 @@ class PicoDet(BaseDetector):
 
															             assigner = ppdet.modeling.SimOTAAssigner(
														
 
															                 candidate_topk=10, iou_weight=6, num_classes=num_classes)
														
 
															             nms = ppdet.modeling.MultiClassNMS(
														
 
															-                nms_top_k=nms_top_k,
														
 
															-                keep_top_k=nms_keep_top_k,
														
 
															+                nms_top_k=nms_topk,
														
 
															+                keep_top_k=nms_keep_topk,
														
 
															                 score_threshold=nms_score_threshold,
														
 
															                 nms_threshold=nms_iou_threshold)
														
 
															             head = ppdet.modeling.PicoHead(
														
@@ -783,6 +823,92 @@ class PicoDet(BaseDetector):
 
															         self.fixed_input_shape = image_shape
														
 
															         return self._define_input_spec(image_shape)
														
 
															+    def train(self,
														
 
															+              num_epochs,
														
 
															+              train_dataset,
														
 
															+              train_batch_size=64,
														
 
															+              eval_dataset=None,
														
 
															+              optimizer=None,
														
 
															+              save_interval_epochs=1,
														
 
															+              log_interval_steps=10,
														
 
															+              save_dir='output',
														
 
															+              pretrain_weights='IMAGENET',
														
 
															+              learning_rate=.001,
														
 
															+              warmup_steps=0,
														
 
															+              warmup_start_lr=0.0,
														
 
															+              lr_decay_epochs=(216, 243),
														
 
															+              lr_decay_gamma=0.1,
														
 
															+              metric=None,
														
 
															+              use_ema=False,
														
 
															+              early_stop=False,
														
 
															+              early_stop_patience=5,
														
 
															+              use_vdl=True,
														
 
															+              resume_checkpoint=None):
														
 
															+        """
														
 
															+        Train the model.
														
 
															+        Args:
														
 
															+            num_epochs(int): The number of epochs.
														
 
															+            train_dataset(paddlex.dataset): Training dataset.
														
 
															+            train_batch_size(int, optional): Total batch size among all cards used in training. Defaults to 64.
														
 
															+            eval_dataset(paddlex.dataset, optional):
														
 
															+                Evaluation dataset. If None, the model will not be evaluated during training process. Defaults to None.
														
 
															+            optimizer(paddle.optimizer.Optimizer or None, optional):
														
 
															+                Optimizer used for training. If None, a default optimizer is used. Defaults to None.
														
 
															+            save_interval_epochs(int, optional): Epoch interval for saving the model. Defaults to 1.
														
 
															+            log_interval_steps(int, optional): Step interval for printing training information. Defaults to 10.
														
 
															+            save_dir(str, optional): Directory to save the model. Defaults to 'output'.
														
 
															+            pretrain_weights(str or None, optional):
														
 
															+                None or name/path of pretrained weights. If None, no pretrained weights will be loaded. Defaults to 'IMAGENET'.
														
 
															+            learning_rate(float, optional): Learning rate for training. Defaults to .001.
														
 
															+            warmup_steps(int, optional): The number of steps of warm-up training. Defaults to 0.
														
 
															+            warmup_start_lr(float, optional): Start learning rate of warm-up training. Defaults to 0.0.
														
 
															+            lr_decay_epochs(list or tuple, optional): Epoch milestones for learning rate decay. Defaults to (216, 243).
														
 
															+            lr_decay_gamma(float, optional): Gamma coefficient of learning rate decay. Defaults to .1.
														
 
															+            metric({'VOC', 'COCO', None}, optional):
														
 
															+                Evaluation metric. If None, determine the metric according to the dataset format. Defaults to None.
														
 
															+            use_ema(bool, optional): Whether to use exponential moving average strategy. Defaults to False.
														
 
															+            early_stop(bool, optional): Whether to adopt early stop strategy. Defaults to False.
														
 
															+            early_stop_patience(int, optional): Early stop patience. Defaults to 5.
														
 
															+            use_vdl(bool, optional): Whether to use VisualDL to monitor the training process. Defaults to True.
														
 
															+            resume_checkpoint(str or None, optional): The path of the checkpoint to resume training from.
														
 
															+                If None, no training checkpoint will be resumed. At most one of `resume_checkpoint` and
														
 
															+                `pretrain_weights` can be set simultaneously. Defaults to None.
														
 
															+        """
														
 
															+        if optimizer is None:
														
 
															+            num_steps_each_epoch = len(train_dataset) // train_batch_size
														
 
															+            optimizer = self.default_optimizer(
														
 
															+                parameters=self.net.parameters(),
														
 
															+                learning_rate=learning_rate,
														
 
															+                warmup_steps=warmup_steps,
														
 
															+                warmup_start_lr=warmup_start_lr,
														
 
															+                lr_decay_epochs=lr_decay_epochs,
														
 
															+                lr_decay_gamma=lr_decay_gamma,
														
 
															+                num_steps_each_epoch=num_steps_each_epoch,
														
 
															+                reg_coeff=4e-05,
														
 
															+                scheduler='Cosine',
														
 
															+                num_epochs=num_epochs)
														
 
															+        super(PicoDet, self).train(
														
 
															+            num_epochs=num_epochs,
														
 
															+            train_dataset=train_dataset,
														
 
															+            train_batch_size=train_batch_size,
														
 
															+            eval_dataset=eval_dataset,
														
 
															+            optimizer=optimizer,
														
 
															+            save_interval_epochs=save_interval_epochs,
														
 
															+            log_interval_steps=log_interval_steps,
														
 
															+            save_dir=save_dir,
														
 
															+            pretrain_weights=pretrain_weights,
														
 
															+            learning_rate=learning_rate,
														
 
															+            warmup_steps=warmup_steps,
														
 
															+            warmup_start_lr=warmup_start_lr,
														
 
															+            lr_decay_epochs=lr_decay_epochs,
														
 
															+            lr_decay_gamma=lr_decay_gamma,
														
 
															+            metric=metric,
														
 
															+            use_ema=use_ema,
														
 
															+            early_stop=early_stop,
														
 
															+            early_stop_patience=early_stop_patience,
														
 
															+            use_vdl=use_vdl,
														
 
															+            resume_checkpoint=resume_checkpoint)
														
 
															+
														
 
															 class YOLOv3(BaseDetector):
														
 
															     def __init__(self,
														
@@ -1226,42 +1352,22 @@ class FasterRCNN(BaseDetector):
 
															         """
														
 
															         if train_dataset.pos_num < len(train_dataset.file_list):
														
 
															             train_dataset.num_workers = 0
														
 
															-            if train_batch_size != 1:
														
 
															-                train_batch_size = 1
														
 
															-                logging.warning(
														
 
															-                    "Training RCNN models with negative samples only support batch size equals to 1 "
														
 
															-                    "on a single gpu/cpu card, `train_batch_size` is forcibly set to 1."
														
 
															-                )
														
 
															-            nranks = paddle.distributed.get_world_size()
														
 
															-            local_rank = paddle.distributed.get_rank()
														
 
															-            # single card training
														
 
															-            if nranks < 2 or local_rank == 0:
														
 
															-                super(FasterRCNN, self).train(
														
 
															-                    num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															-                    optimizer, save_interval_epochs, log_interval_steps,
														
 
															-                    save_dir, pretrain_weights, learning_rate, warmup_steps,
														
 
															-                    warmup_start_lr, lr_decay_epochs, lr_decay_gamma, metric,
														
 
															-                    use_ema, early_stop, early_stop_patience, use_vdl,
														
 
															-                    resume_checkpoint)
														
 
															-        else:
														
 
															-            super(FasterRCNN, self).train(
														
 
															-                num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															-                optimizer, save_interval_epochs, log_interval_steps, save_dir,
														
 
															-                pretrain_weights, learning_rate, warmup_steps, warmup_start_lr,
														
 
															-                lr_decay_epochs, lr_decay_gamma, metric, use_ema, early_stop,
														
 
															-                early_stop_patience, use_vdl, resume_checkpoint)
														
 
															+        super(FasterRCNN, self).train(
														
 
															+            num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															+            optimizer, save_interval_epochs, log_interval_steps, save_dir,
														
 
															+            pretrain_weights, learning_rate, warmup_steps, warmup_start_lr,
														
 
															+            lr_decay_epochs, lr_decay_gamma, metric, use_ema, early_stop,
														
 
															+            early_stop_patience, use_vdl, resume_checkpoint)
														
 
															     def _compose_batch_transform(self, transforms, mode='train'):
														
 
															         if mode == 'train':
														
 
															             default_batch_transforms = [
														
 
															                 _BatchPadding(pad_to_stride=32 if self.with_fpn else -1)
														
 
															             ]
														
 
															-            collate_batch = False
														
 
															         else:
														
 
															             default_batch_transforms = [
														
 
															                 _BatchPadding(pad_to_stride=32 if self.with_fpn else -1)
														
 
															             ]
														
 
															-            collate_batch = True
														
 
															         custom_batch_transforms = []
														
 
															         for i, op in enumerate(transforms.transforms):
														
 
															             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
														
@@ -1274,7 +1380,7 @@ class FasterRCNN(BaseDetector):
 
															         batch_transforms = BatchCompose(
														
 
															             custom_batch_transforms + default_batch_transforms,
														
 
															-            collate_batch=collate_batch)
														
 
															+            collate_batch=False)
														
 
															         return batch_transforms
														
@@ -2074,42 +2180,22 @@ class MaskRCNN(BaseDetector):
 
															         """
														
 
															         if train_dataset.pos_num < len(train_dataset.file_list):
														
 
															             train_dataset.num_workers = 0
														
 
															-            if train_batch_size != 1:
														
 
															-                train_batch_size = 1
														
 
															-                logging.warning(
														
 
															-                    "Training RCNN models with negative samples only support batch size equals to 1 "
														
 
															-                    "on a single gpu/cpu card, `train_batch_size` is forcibly set to 1."
														
 
															-                )
														
 
															-            nranks = paddle.distributed.get_world_size()
														
 
															-            local_rank = paddle.distributed.get_rank()
														
 
															-            # single card training
														
 
															-            if nranks < 2 or local_rank == 0:
														
 
															-                super(MaskRCNN, self).train(
														
 
															-                    num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															-                    optimizer, save_interval_epochs, log_interval_steps,
														
 
															-                    save_dir, pretrain_weights, learning_rate, warmup_steps,
														
 
															-                    warmup_start_lr, lr_decay_epochs, lr_decay_gamma, metric,
														
 
															-                    use_ema, early_stop, early_stop_patience, use_vdl,
														
 
															-                    resume_checkpoint)
														
 
															-        else:
														
 
															-            super(MaskRCNN, self).train(
														
 
															-                num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															-                optimizer, save_interval_epochs, log_interval_steps, save_dir,
														
 
															-                pretrain_weights, learning_rate, warmup_steps, warmup_start_lr,
														
 
															-                lr_decay_epochs, lr_decay_gamma, metric, use_ema, early_stop,
														
 
															-                early_stop_patience, use_vdl, resume_checkpoint)
														
 
															+        super(MaskRCNN, self).train(
														
 
															+            num_epochs, train_dataset, train_batch_size, eval_dataset,
														
 
															+            optimizer, save_interval_epochs, log_interval_steps, save_dir,
														
 
															+            pretrain_weights, learning_rate, warmup_steps, warmup_start_lr,
														
 
															+            lr_decay_epochs, lr_decay_gamma, metric, use_ema, early_stop,
														
 
															+            early_stop_patience, use_vdl, resume_checkpoint)
														
 
															     def _compose_batch_transform(self, transforms, mode='train'):
														
 
															         if mode == 'train':
														
 
															             default_batch_transforms = [
														
 
															                 _BatchPadding(pad_to_stride=32 if self.with_fpn else -1)
														
 
															             ]
														
 
															-            collate_batch = False
														
 
															         else:
														
 
															             default_batch_transforms = [
														
 
															                 _BatchPadding(pad_to_stride=32 if self.with_fpn else -1)
														
 
															             ]
														
 
															-            collate_batch = True
														
 
															         custom_batch_transforms = []
														
 
															         for i, op in enumerate(transforms.transforms):
														
 
															             if isinstance(op, (BatchRandomResize, BatchRandomResizeByShort)):
														
@@ -2122,7 +2208,7 @@ class MaskRCNN(BaseDetector):
 
															         batch_transforms = BatchCompose(
														
 
															             custom_batch_transforms + default_batch_transforms,
														
 
															-            collate_batch=collate_batch)
														
 
															+            collate_batch=False)
														
 
															         return batch_transforms
														
--- a/paddlex/cv/models/utils/ema.py
+++ b/paddlex/cv/models/utils/ema.py
@@ -1,48 +0,0 @@
 
															-# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#    http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-import paddle
														
 
															-
														
 
															-
														
 
															-class ExponentialMovingAverage(object):
														
 
															-    def __init__(self, decay, model, use_thres_step=False):
														
 
															-        self.step = 0
														
 
															-        self.decay = decay
														
 
															-        self.shadow = dict()
														
 
															-        for k, v in model.state_dict().items():
														
 
															-            self.shadow[k] = paddle.zeros_like(v)
														
 
															-        self.use_thres_step = use_thres_step
														
 
															-
														
 
															-    def update(self, model):
														
 
															-        if self.use_thres_step:
														
 
															-            decay = min(self.decay, (1 + self.step) / (10 + self.step))
														
 
															-        else:
														
 
															-            decay = self.decay
														
 
															-        self._decay = decay
														
 
															-        model_dict = model.state_dict()
														
 
															-        for k, v in self.shadow.items():
														
 
															-            v = decay * v + (1 - decay) * model_dict[k]
														
 
															-            v.stop_gradient = True
														
 
															-            self.shadow[k] = v
														
 
															-        self.step += 1
														
 
															-
														
 
															-    def apply(self):
														
 
															-        if self.step == 0:
														
 
															-            return self.shadow
														
 
															-        state_dict = dict()
														
 
															-        for k, v in self.shadow.items():
														
 
															-            v = v / (1 - self._decay**self.step)
														
 
															-            v.stop_gradient = True
														
 
															-            state_dict[k] = v
														
 
															-        return state_dict
														
--- a/paddlex/paddleseg/cvlibs/param_init.py
+++ b/paddlex/paddleseg/cvlibs/param_init.py
@@ -58,7 +58,7 @@ def normal_init(param, **kwargs):
 
															 def kaiming_normal_init(param, **kwargs):
														
 
															-    """
														
 
															+    r"""
														
 
															     Initialize the input tensor with Kaiming Normal initialization.
														
 
															     This function implements the `param` initialization from the paper
														
--- a/paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py
+++ b/paddlex/paddleseg/models/losses/binary_cross_entropy_loss.py
@@ -21,7 +21,7 @@ from paddlex.paddleseg.cvlibs import manager
 
															 @manager.LOSSES.add_component
														
 
															 class BCELoss(nn.Layer):
														
 
															-    """
														
 
															+    r"""
														
 
															     This operator combines the sigmoid layer and the :ref:`api_nn_loss_BCELoss` layer.
														
 
															     Also, we can see it as the combine of ``sigmoid_cross_entropy_with_logits``
														
 
															     layer and some reduce operations.
														
--- a/paddlex/paddleseg/models/losses/lovasz_loss.py
+++ b/paddlex/paddleseg/models/losses/lovasz_loss.py
@@ -41,7 +41,7 @@ class LovaszSoftmaxLoss(nn.Layer):
 
															         self.classes = classes
														
 
															     def forward(self, logits, labels):
														
 
															-        """
														
 
															+        r"""
														
 
															         Forward computation.
														
 
															         Args:
														
@@ -68,7 +68,7 @@ class LovaszHingeLoss(nn.Layer):
 
															         self.ignore_index = ignore_index
														
 
															     def forward(self, logits, labels):
														
 
															-        """
														
 
															+        r"""
														
 
															         Forward computation.
														
 
															         Args:
														
@@ -111,7 +111,7 @@ def binary_channel_to_unary(logits, eps=1e-9):
 
															 def lovasz_hinge_flat(logits, labels):
														
 
															-    """
														
 
															+    r"""
														
 
															     Binary Lovasz hinge loss.
														
 
															     Args:
														
--- a/paddlex/ppdet/engine/trainer.py
+++ b/paddlex/ppdet/engine/trainer.py
@@ -33,6 +33,7 @@ from paddle.static import InputSpec
 
															 from paddlex.ppdet.optimizer import ModelEMA
														
 
															 from paddlex.ppdet.core.workspace import create
														
 
															+from paddlex.ppdet.modeling.architectures.meta_arch import BaseArch
														
 
															 from paddlex.ppdet.utils.checkpoint import load_weight, load_pretrain_weight
														
 
															 from paddlex.ppdet.utils.visualizer import visualize_results, save_result
														
 
															 from paddlex.ppdet.metrics import Metric, COCOMetric, VOCMetric, WiderFaceMetric, get_infer_results, KeyPointTopDownCOCOEval, KeyPointTopDownMPIIEval
														
@@ -111,8 +112,12 @@ class Trainer(object):
 
															         if self.mode == 'eval':
														
 
															             self._eval_batch_sampler = paddle.io.BatchSampler(
														
 
															                 self.dataset, batch_size=self.cfg.EvalReader['batch_size'])
														
 
															-            self.loader = create('{}Reader'.format(self.mode.capitalize()))(
														
 
															-                self.dataset, cfg.worker_num, self._eval_batch_sampler)
														
 
															+            reader_name = '{}Reader'.format(self.mode.capitalize())
														
 
															+            # If metric is VOC, need to be set collate_batch=False.
														
 
															+            if cfg.metric == 'VOC':
														
 
															+                cfg[reader_name]['collate_batch'] = False
														
 
															+            self.loader = create(reader_name)(self.dataset, cfg.worker_num,
														
 
															+                                              self._eval_batch_sampler)
														
 
															         # TestDataset build after user set images, skip loader creation here
														
 
															         # build optimizer in train mode
														
@@ -336,6 +341,12 @@ class Trainer(object):
 
															         assert self.mode == 'train', "Model not in 'train' mode"
														
 
															         Init_mark = False
														
 
															+        sync_bn = (
														
 
															+            getattr(self.cfg, 'norm_type', None) in [None, 'sync_bn'] and
														
 
															+            self.cfg.use_gpu and self._nranks > 1)
														
 
															+        if sync_bn:
														
 
															+            self.model = BaseArch.convert_sync_batchnorm(self.model)
														
 
															+
														
 
															         model = self.model
														
 
															         if self.cfg.get('fleet', False):
														
 
															             model = fleet.distributed_model(model)
														
@@ -364,7 +375,9 @@ class Trainer(object):
 
															         self.status['training_staus'] = stats.TrainingStats(self.cfg.log_iter)
														
 
															         if self.cfg.get('print_flops', False):
														
 
															-            self._flops(self.loader)
														
 
															+            flops_loader = create('{}Reader'.format(self.mode.capitalize()))(
														
 
															+                self.dataset, self.cfg.worker_num)
														
 
															+            self._flops(flops_loader)
														
 
															         profiler_options = self.cfg.get('profiler_options', None)
														
 
															         self._compose_callback.on_train_begin(self.status)
														
@@ -436,6 +449,9 @@ class Trainer(object):
 
															                         paddle.io.BatchSampler(
														
 
															                             self._eval_dataset,
														
 
															                             batch_size=self.cfg.EvalReader['batch_size'])
														
 
															+                    # If metric is VOC, need to be set collate_batch=False.
														
 
															+                    if self.cfg.metric == 'VOC':
														
 
															+                        self.cfg['EvalReader']['collate_batch'] = False
														
 
															                     self._eval_loader = create('EvalReader')(
														
 
															                         self._eval_dataset,
														
 
															                         self.cfg.worker_num,
														
@@ -463,7 +479,9 @@ class Trainer(object):
 
															         self.status['mode'] = 'eval'
														
 
															         self.model.eval()
														
 
															         if self.cfg.get('print_flops', False):
														
 
															-            self._flops(loader)
														
 
															+            flops_loader = create('{}Reader'.format(self.mode.capitalize()))(
														
 
															+                self.dataset, self.cfg.worker_num, self._eval_batch_sampler)
														
 
															+            self._flops(flops_loader)
														
 
															         for step_id, data in enumerate(loader):
														
 
															             self.status['step_id'] = step_id
														
 
															             self._compose_callback.on_step_begin(self.status)
														
@@ -514,7 +532,8 @@ class Trainer(object):
 
															         self.status['mode'] = 'test'
														
 
															         self.model.eval()
														
 
															         if self.cfg.get('print_flops', False):
														
 
															-            self._flops(loader)
														
 
															+            flops_loader = create('TestReader')(self.dataset, 0)
														
 
															+            self._flops(flops_loader)
														
 
															         results = []
														
 
															         for step_id, data in enumerate(loader):
														
 
															             self.status['step_id'] = step_id
														
--- a/paddlex/ppdet/model_zoo/tests/__init__.py
+++ b/paddlex/ppdet/model_zoo/tests/__init__.py
@@ -1,13 +0,0 @@
 
															-#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
--- a/paddlex/ppdet/model_zoo/tests/test_get_model.py
+++ b/paddlex/ppdet/model_zoo/tests/test_get_model.py
@@ -1,48 +0,0 @@
 
															-#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import absolute_import
														
 
															-from __future__ import division
														
 
															-from __future__ import print_function
														
 
															-
														
 
															-import os
														
 
															-import paddle
														
 
															-import paddlex.ppdet
														
 
															-import unittest
														
 
															-
														
 
															-# NOTE: weights downloading costs time, we choose
														
 
															-#       a small model for unittesting
														
 
															-MODEL_NAME = 'ppyolo/ppyolo_tiny_650e_coco'
														
 
															-
														
 
															-
														
 
															-class TestGetConfigFile(unittest.TestCase):
														
 
															-    def test_main(self):
														
 
															-        try:
														
 
															-            cfg_file = ppdet.model_zoo.get_config_file(MODEL_NAME)
														
 
															-            assert os.path.isfile(cfg_file)
														
 
															-        except:
														
 
															-            self.assertTrue(False)
														
 
															-
														
 
															-
														
 
															-class TestGetModel(unittest.TestCase):
														
 
															-    def test_main(self):
														
 
															-        try:
														
 
															-            model = ppdet.model_zoo.get_model(MODEL_NAME)
														
 
															-            assert isinstance(model, paddle.nn.Layer)
														
 
															-        except:
														
 
															-            self.assertTrue(False)
														
 
															-
														
 
															-
														
 
															-if __name__ == '__main__':
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/model_zoo/tests/test_list_model.py
+++ b/paddlex/ppdet/model_zoo/tests/test_list_model.py
@@ -1,68 +0,0 @@
 
															-#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import absolute_import
														
 
															-from __future__ import division
														
 
															-from __future__ import print_function
														
 
															-
														
 
															-import unittest
														
 
															-import paddlex.ppdet
														
 
															-
														
 
															-
														
 
															-class TestListModel(unittest.TestCase):
														
 
															-    def setUp(self):
														
 
															-        self._filter = []
														
 
															-
														
 
															-    def test_main(self):
														
 
															-        try:
														
 
															-            ppdet.model_zoo.list_model(self._filter)
														
 
															-            self.assertTrue(True)
														
 
															-        except:
														
 
															-            self.assertTrue(False)
														
 
															-
														
 
															-
														
 
															-class TestListModelYOLO(TestListModel):
														
 
															-    def setUp(self):
														
 
															-        self._filter = ['yolo']
														
 
															-
														
 
															-
														
 
															-class TestListModelRCNN(TestListModel):
														
 
															-    def setUp(self):
														
 
															-        self._filter = ['rcnn']
														
 
															-
														
 
															-
														
 
															-class TestListModelSSD(TestListModel):
														
 
															-    def setUp(self):
														
 
															-        self._filter = ['ssd']
														
 
															-
														
 
															-
														
 
															-class TestListModelMultiFilter(TestListModel):
														
 
															-    def setUp(self):
														
 
															-        self._filter = ['yolo', 'darknet']
														
 
															-
														
 
															-
														
 
															-class TestListModelError(unittest.TestCase):
														
 
															-    def setUp(self):
														
 
															-        self._filter = ['xxx']
														
 
															-
														
 
															-    def test_main(self):
														
 
															-        try:
														
 
															-            ppdet.model_zoo.list_model(self._filter)
														
 
															-            self.assertTrue(False)
														
 
															-        except ValueError:
														
 
															-            self.assertTrue(True)
														
 
															-
														
 
															-
														
 
															-if __name__ == '__main__':
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/modeling/architectures/meta_arch.py
+++ b/paddlex/ppdet/modeling/architectures/meta_arch.py
@@ -126,3 +126,16 @@ class BaseArch(nn.Layer):
 
															     def get_pred(self, ):
														
 
															         raise NotImplementedError("Should implement get_pred method!")
														
 
															+
														
 
															+    @classmethod
														
 
															+    def convert_sync_batchnorm(cls, layer):
														
 
															+        layer_output = layer
														
 
															+        if getattr(layer, 'norm_type', None) == 'sync_bn':
														
 
															+            layer_output = nn.SyncBatchNorm.convert_sync_batchnorm(layer)
														
 
															+        else:
														
 
															+            for name, sublayer in layer.named_children():
														
 
															+                layer_output.add_sublayer(name,
														
 
															+                                          cls.convert_sync_batchnorm(sublayer))
														
 
															+
														
 
															+        del layer
														
 
															+        return layer_output
														
--- a/paddlex/ppdet/modeling/backbones/blazenet.py
+++ b/paddlex/ppdet/modeling/backbones/blazenet.py
@@ -58,11 +58,8 @@ class ConvBNLayer(nn.Layer):
 
															                 learning_rate=conv_lr, initializer=KaimingNormal()),
														
 
															             bias_attr=False)
														
 
															-        if norm_type == 'sync_bn':
														
 
															-            self._batch_norm = nn.SyncBatchNorm(out_channels)
														
 
															-        else:
														
 
															-            self._batch_norm = nn.BatchNorm(
														
 
															-                out_channels, act=None, use_global_stats=False)
														
 
															+        if norm_type in ['bn', 'sync_bn']:
														
 
															+            self._batch_norm = nn.BatchNorm2D(out_channels)
														
 
															     def forward(self, x):
														
 
															         x = self._conv(x)
														
--- a/paddlex/ppdet/modeling/backbones/esnet.py
+++ b/paddlex/ppdet/modeling/backbones/esnet.py
@@ -20,7 +20,7 @@ import paddle
 
															 import paddle.nn as nn
														
 
															 import paddle.nn.functional as F
														
 
															 from paddle import ParamAttr
														
 
															-from paddle.nn import Conv2D, MaxPool2D, AdaptiveAvgPool2D, BatchNorm
														
 
															+from paddle.nn import Conv2D, MaxPool2D, AdaptiveAvgPool2D
														
 
															 from paddle.nn.initializer import KaimingNormal
														
 
															 from paddle.regularizer import L2Decay
														
--- a/paddlex/ppdet/modeling/backbones/hrnet.py
+++ b/paddlex/ppdet/modeling/backbones/hrnet.py
@@ -62,11 +62,11 @@ class ConvNormLayer(nn.Layer):
 
															             learning_rate=norm_lr, regularizer=L2Decay(norm_decay))
														
 
															         bias_attr = ParamAttr(
														
 
															             learning_rate=norm_lr, regularizer=L2Decay(norm_decay))
														
 
															-        global_stats = True if freeze_norm else False
														
 
															+        global_stats = True if freeze_norm else None
														
 
															         if norm_type in ['bn', 'sync_bn']:
														
 
															-            self.norm = nn.BatchNorm(
														
 
															+            self.norm = nn.BatchNorm2D(
														
 
															                 ch_out,
														
 
															-                param_attr=param_attr,
														
 
															+                weight_attr=param_attr,
														
 
															                 bias_attr=bias_attr,
														
 
															                 use_global_stats=global_stats)
														
 
															         elif norm_type == 'gn':
														
--- a/paddlex/ppdet/modeling/backbones/lcnet.py
+++ b/paddlex/ppdet/modeling/backbones/lcnet.py
@@ -19,7 +19,7 @@ from __future__ import print_function
 
															 import paddle
														
 
															 import paddle.nn as nn
														
 
															 from paddle import ParamAttr
														
 
															-from paddle.nn import AdaptiveAvgPool2D, BatchNorm, Conv2D, Dropout, Linear
														
 
															+from paddle.nn import AdaptiveAvgPool2D, Conv2D
														
 
															 from paddle.regularizer import L2Decay
														
 
															 from paddle.nn.initializer import KaimingNormal
														
@@ -81,9 +81,9 @@ class ConvBNLayer(nn.Layer):
 
															             weight_attr=ParamAttr(initializer=KaimingNormal()),
														
 
															             bias_attr=False)
														
 
															-        self.bn = BatchNorm(
														
 
															+        self.bn = nn.BatchNorm2D(
														
 
															             num_filters,
														
 
															-            param_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															+            weight_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															             bias_attr=ParamAttr(regularizer=L2Decay(0.0)))
														
 
															         self.hardswish = nn.Hardswish()
														
--- a/paddlex/ppdet/modeling/backbones/lite_hrnet.py
+++ b/paddlex/ppdet/modeling/backbones/lite_hrnet.py
@@ -56,11 +56,11 @@ class ConvNormLayer(nn.Layer):
 
															                 regularizer=L2Decay(norm_decay), )
														
 
															             bias_attr = ParamAttr(
														
 
															                 learning_rate=norm_lr, regularizer=L2Decay(norm_decay))
														
 
															-            global_stats = True if freeze_norm else False
														
 
															+            global_stats = True if freeze_norm else None
														
 
															             if norm_type in ['bn', 'sync_bn']:
														
 
															-                self.norm = nn.BatchNorm(
														
 
															+                self.norm = nn.BatchNorm2D(
														
 
															                     ch_out,
														
 
															-                    param_attr=param_attr,
														
 
															+                    weight_attr=param_attr,
														
 
															                     bias_attr=bias_attr,
														
 
															                     use_global_stats=global_stats, )
														
 
															             elif norm_type == 'gn':
														
@@ -582,7 +582,7 @@ class LiteHRNetModule(nn.Layer):
 
															                                 stride=1,
														
 
															                                 padding=0,
														
 
															                                 bias=False, ),
														
 
															-                            nn.BatchNorm(self.in_channels[i]),
														
 
															+                            nn.BatchNorm2D(self.in_channels[i]),
														
 
															                             nn.Upsample(
														
 
															                                 scale_factor=2**(j - i), mode='nearest')))
														
 
															                 elif j == i:
														
@@ -601,7 +601,7 @@ class LiteHRNetModule(nn.Layer):
 
															                                         padding=1,
														
 
															                                         groups=self.in_channels[j],
														
 
															                                         bias=False, ),
														
 
															-                                    nn.BatchNorm(self.in_channels[j]),
														
 
															+                                    nn.BatchNorm2D(self.in_channels[j]),
														
 
															                                     L.Conv2d(
														
 
															                                         self.in_channels[j],
														
 
															                                         self.in_channels[i],
														
@@ -609,7 +609,7 @@ class LiteHRNetModule(nn.Layer):
 
															                                         stride=1,
														
 
															                                         padding=0,
														
 
															                                         bias=False, ),
														
 
															-                                    nn.BatchNorm(self.in_channels[i])))
														
 
															+                                    nn.BatchNorm2D(self.in_channels[i])))
														
 
															                         else:
														
 
															                             conv_downsamples.append(
														
 
															                                 nn.Sequential(
														
@@ -621,7 +621,7 @@ class LiteHRNetModule(nn.Layer):
 
															                                         padding=1,
														
 
															                                         groups=self.in_channels[j],
														
 
															                                         bias=False, ),
														
 
															-                                    nn.BatchNorm(self.in_channels[j]),
														
 
															+                                    nn.BatchNorm2D(self.in_channels[j]),
														
 
															                                     L.Conv2d(
														
 
															                                         self.in_channels[j],
														
 
															                                         self.in_channels[j],
														
@@ -629,7 +629,7 @@ class LiteHRNetModule(nn.Layer):
 
															                                         stride=1,
														
 
															                                         padding=0,
														
 
															                                         bias=False, ),
														
 
															-                                    nn.BatchNorm(self.in_channels[j]),
														
 
															+                                    nn.BatchNorm2D(self.in_channels[j]),
														
 
															                                     nn.ReLU()))
														
 
															                     fuse_layer.append(nn.Sequential(*conv_downsamples))
														
@@ -777,7 +777,7 @@ class LiteHRNet(nn.Layer):
 
															                                 padding=1,
														
 
															                                 groups=num_channels_pre_layer[i],
														
 
															                                 bias=False),
														
 
															-                            nn.BatchNorm(num_channels_pre_layer[i]),
														
 
															+                            nn.BatchNorm2D(num_channels_pre_layer[i]),
														
 
															                             L.Conv2d(
														
 
															                                 num_channels_pre_layer[i],
														
 
															                                 num_channels_cur_layer[i],
														
@@ -785,7 +785,7 @@ class LiteHRNet(nn.Layer):
 
															                                 stride=1,
														
 
															                                 padding=0,
														
 
															                                 bias=False, ),
														
 
															-                            nn.BatchNorm(num_channels_cur_layer[i]),
														
 
															+                            nn.BatchNorm2D(num_channels_cur_layer[i]),
														
 
															                             nn.ReLU()))
														
 
															                 else:
														
 
															                     transition_layers.append(None)
														
@@ -802,7 +802,7 @@ class LiteHRNet(nn.Layer):
 
															                                 stride=2,
														
 
															                                 padding=1,
														
 
															                                 bias=False, ),
														
 
															-                            nn.BatchNorm(num_channels_pre_layer[-1]),
														
 
															+                            nn.BatchNorm2D(num_channels_pre_layer[-1]),
														
 
															                             L.Conv2d(
														
 
															                                 num_channels_pre_layer[-1],
														
 
															                                 num_channels_cur_layer[i]
														
@@ -812,9 +812,9 @@ class LiteHRNet(nn.Layer):
 
															                                 stride=1,
														
 
															                                 padding=0,
														
 
															                                 bias=False, ),
														
 
															-                            nn.BatchNorm(num_channels_cur_layer[i]
														
 
															-                                         if j == i - num_branches_pre else
														
 
															-                                         num_channels_pre_layer[-1]),
														
 
															+                            nn.BatchNorm2D(num_channels_cur_layer[i]
														
 
															+                                           if j == i - num_branches_pre else
														
 
															+                                           num_channels_pre_layer[-1]),
														
 
															                             nn.ReLU()))
														
 
															                 transition_layers.append(nn.Sequential(*conv_downsamples))
														
 
															         return nn.LayerList(transition_layers)
														
--- a/paddlex/ppdet/modeling/backbones/mobilenet_v1.py
+++ b/paddlex/ppdet/modeling/backbones/mobilenet_v1.py
@@ -59,16 +59,9 @@ class ConvBNLayer(nn.Layer):
 
															         param_attr = ParamAttr(regularizer=L2Decay(norm_decay))
														
 
															         bias_attr = ParamAttr(regularizer=L2Decay(norm_decay))
														
 
															-        if norm_type == 'sync_bn':
														
 
															-            self._batch_norm = nn.SyncBatchNorm(
														
 
															+        if norm_type in ['sync_bn', 'bn']:
														
 
															+            self._batch_norm = nn.BatchNorm2D(
														
 
															                 out_channels, weight_attr=param_attr, bias_attr=bias_attr)
														
 
															-        else:
														
 
															-            self._batch_norm = nn.BatchNorm(
														
 
															-                out_channels,
														
 
															-                act=None,
														
 
															-                param_attr=param_attr,
														
 
															-                bias_attr=bias_attr,
														
 
															-                use_global_stats=False)
														
 
															     def forward(self, x):
														
 
															         x = self._conv(x)
														
--- a/paddlex/ppdet/modeling/backbones/mobilenet_v3.py
+++ b/paddlex/ppdet/modeling/backbones/mobilenet_v3.py
@@ -74,15 +74,11 @@ class ConvBNLayer(nn.Layer):
 
															             learning_rate=norm_lr,
														
 
															             regularizer=L2Decay(norm_decay),
														
 
															             trainable=False if freeze_norm else True)
														
 
															-        global_stats = True if freeze_norm else False
														
 
															-        if norm_type == 'sync_bn':
														
 
															-            self.bn = nn.SyncBatchNorm(
														
 
															-                out_c, weight_attr=param_attr, bias_attr=bias_attr)
														
 
															-        else:
														
 
															-            self.bn = nn.BatchNorm(
														
 
															+        global_stats = True if freeze_norm else None
														
 
															+        if norm_type in ['sync_bn', 'bn']:
														
 
															+            self.bn = nn.BatchNorm2D(
														
 
															                 out_c,
														
 
															-                act=None,
														
 
															-                param_attr=param_attr,
														
 
															+                weight_attr=param_attr,
														
 
															                 bias_attr=bias_attr,
														
 
															                 use_global_stats=global_stats)
														
 
															         norm_params = self.bn.parameters()
														
--- a/paddlex/ppdet/modeling/backbones/resnet.py
+++ b/paddlex/ppdet/modeling/backbones/resnet.py
@@ -100,15 +100,11 @@ class ConvNormLayer(nn.Layer):
 
															             regularizer=L2Decay(norm_decay),
														
 
															             trainable=False if freeze_norm else True)
														
 
															-        global_stats = True if freeze_norm else False
														
 
															-        if norm_type == 'sync_bn':
														
 
															-            self.norm = nn.SyncBatchNorm(
														
 
															-                ch_out, weight_attr=param_attr, bias_attr=bias_attr)
														
 
															-        else:
														
 
															-            self.norm = nn.BatchNorm(
														
 
															+        global_stats = True if freeze_norm else None
														
 
															+        if norm_type in ['sync_bn', 'bn']:
														
 
															+            self.norm = nn.BatchNorm2D(
														
 
															                 ch_out,
														
 
															-                act=None,
														
 
															-                param_attr=param_attr,
														
 
															+                weight_attr=param_attr,
														
 
															                 bias_attr=bias_attr,
														
 
															                 use_global_stats=global_stats)
														
 
															         norm_params = self.norm.parameters()
														
--- a/paddlex/ppdet/modeling/backbones/shufflenet_v2.py
+++ b/paddlex/ppdet/modeling/backbones/shufflenet_v2.py
@@ -19,7 +19,8 @@ from __future__ import print_function
 
															 import paddle
														
 
															 import paddle.nn as nn
														
 
															 from paddle import ParamAttr
														
 
															-from paddle.nn import Conv2D, MaxPool2D, AdaptiveAvgPool2D, BatchNorm
														
 
															+import paddle.nn.functional as F
														
 
															+from paddle.nn import Conv2D, MaxPool2D, AdaptiveAvgPool2D, BatchNorm2D
														
 
															 from paddle.nn.initializer import KaimingNormal
														
 
															 from paddle.regularizer import L2Decay
														
@@ -51,15 +52,19 @@ class ConvBNLayer(nn.Layer):
 
															             weight_attr=ParamAttr(initializer=KaimingNormal()),
														
 
															             bias_attr=False)
														
 
															-        self._batch_norm = BatchNorm(
														
 
															+        self._batch_norm = BatchNorm2D(
														
 
															             out_channels,
														
 
															-            param_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															-            bias_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															-            act=act)
														
 
															+            weight_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															+            bias_attr=ParamAttr(regularizer=L2Decay(0.0)))
														
 
															+        if act == "hard_swish":
														
 
															+            act = 'hardswish'
														
 
															+        self.act = act
														
 
															     def forward(self, inputs):
														
 
															         y = self._conv(inputs)
														
 
															         y = self._batch_norm(y)
														
 
															+        if self.act:
														
 
															+            y = getattr(F, self.act)(y)
														
 
															         return y
														
--- a/paddlex/ppdet/modeling/backbones/swin_transformer.py
+++ b/paddlex/ppdet/modeling/backbones/swin_transformer.py
@@ -493,8 +493,13 @@ class BasicLayer(nn.Layer):
 
															         cnt = 0
														
 
															         for h in h_slices:
														
 
															             for w in w_slices:
														
 
															-                img_mask[:, h, w, :] = cnt
														
 
															+                try:
														
 
															+                    img_mask[:, h, w, :] = cnt
														
 
															+                except:
														
 
															+                    pass
														
 
															+
														
 
															                 cnt += 1
														
 
															+
														
 
															         mask_windows = window_partition(
														
 
															             img_mask, self.window_size)  # nW, window_size, window_size, 1
														
 
															         mask_windows = mask_windows.reshape(
														
--- a/paddlex/ppdet/modeling/layers.py
+++ b/paddlex/ppdet/modeling/layers.py
@@ -176,12 +176,9 @@ class ConvNormLayer(nn.Layer):
 
															             learning_rate=norm_lr,
														
 
															             regularizer=L2Decay(norm_decay)
														
 
															             if norm_decay is not None else None)
														
 
															-        if norm_type == 'bn':
														
 
															+        if norm_type in ['bn', 'sync_bn']:
														
 
															             self.norm = nn.BatchNorm2D(
														
 
															                 ch_out, weight_attr=param_attr, bias_attr=bias_attr)
														
 
															-        elif norm_type == 'sync_bn':
														
 
															-            self.norm = nn.SyncBatchNorm(
														
 
															-                ch_out, weight_attr=param_attr, bias_attr=bias_attr)
														
 
															         elif norm_type == 'gn':
														
 
															             self.norm = nn.GroupNorm(
														
 
															                 num_groups=norm_groups,
														
--- a/paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py
+++ b/paddlex/ppdet/modeling/mot/tracker/base_jde_tracker.py
@@ -102,31 +102,26 @@ class BaseTrack(object):
 
															 @register
														
 
															 @serializable
														
 
															 class STrack(BaseTrack):
														
 
															-    def __init__(self,
														
 
															-                 tlwh,
														
 
															-                 score,
														
 
															-                 temp_feat,
														
 
															-                 num_classes,
														
 
															-                 cls_id,
														
 
															-                 buff_size=30):
														
 
															-        # object class id
														
 
															-        self.cls_id = cls_id
														
 
															+    def __init__(self, tlwh, score, cls_id, buff_size=30, temp_feat=None):
														
 
															         # wait activate
														
 
															         self._tlwh = np.asarray(tlwh, dtype=np.float)
														
 
															+        self.score = score
														
 
															+        self.cls_id = cls_id
														
 
															+        self.track_len = 0
														
 
															+
														
 
															         self.kalman_filter = None
														
 
															         self.mean, self.covariance = None, None
														
 
															         self.is_activated = False
														
 
															-        self.score = score
														
 
															-        self.track_len = 0
														
 
															-
														
 
															-        self.smooth_feat = None
														
 
															-        self.update_features(temp_feat)
														
 
															-        self.features = deque([], maxlen=buff_size)
														
 
															-        self.alpha = 0.9
														
 
															+        self.use_reid = True if temp_feat is not None else False
														
 
															+        if self.use_reid:
														
 
															+            self.smooth_feat = None
														
 
															+            self.update_features(temp_feat)
														
 
															+            self.features = deque([], maxlen=buff_size)
														
 
															+            self.alpha = 0.9
														
 
															     def update_features(self, feat):
														
 
															-        # L2 normalizing
														
 
															+        # L2 normalizing, this function has no use for BYTETracker
														
 
															         feat /= np.linalg.norm(feat)
														
 
															         self.curr_feat = feat
														
 
															         if self.smooth_feat is None:
														
@@ -182,7 +177,8 @@ class STrack(BaseTrack):
 
															     def re_activate(self, new_track, frame_id, new_id=False):
														
 
															         self.mean, self.covariance = self.kalman_filter.update(
														
 
															             self.mean, self.covariance, self.tlwh_to_xyah(new_track.tlwh))
														
 
															-        self.update_features(new_track.curr_feat)
														
 
															+        if self.use_reid:
														
 
															+            self.update_features(new_track.curr_feat)
														
 
															         self.track_len = 0
														
 
															         self.state = TrackState.Tracked
														
 
															         self.is_activated = True
														
@@ -201,7 +197,7 @@ class STrack(BaseTrack):
 
															         self.is_activated = True  # set flag 'activated'
														
 
															         self.score = new_track.score
														
 
															-        if update_feature:
														
 
															+        if update_feature and self.use_reid:
														
 
															             self.update_features(new_track.curr_feat)
														
 
															     @property
														
--- a/paddlex/ppdet/modeling/mot/tracker/jde_tracker.py
+++ b/paddlex/ppdet/modeling/mot/tracker/jde_tracker.py
@@ -58,6 +58,7 @@ class JDETracker(object):
 
															     """

														
 
															     def __init__(self,

														
 
															+                 use_byte=False,

														
 
															                  num_classes=1,

														
 
															                  det_thresh=0.3,

														
 
															                  track_buffer=30,

														
@@ -66,11 +67,14 @@ class JDETracker(object):
 
															                  tracked_thresh=0.7,

														
 
															                  r_tracked_thresh=0.5,

														
 
															                  unconfirmed_thresh=0.7,

														
 
															-                 motion='KalmanFilter',

														
 
															                  conf_thres=0,

														
 
															+                 match_thres=0.8,

														
 
															+                 low_conf_thres=0.2,

														
 
															+                 motion='KalmanFilter',

														
 
															                  metric_type='euclidean'):

														
 
															+        self.use_byte = use_byte

														
 
															         self.num_classes = num_classes

														
 
															-        self.det_thresh = det_thresh

														
 
															+        self.det_thresh = det_thresh if not use_byte else conf_thres + 0.1

														
 
															         self.track_buffer = track_buffer

														
 
															         self.min_box_area = min_box_area

														
 
															         self.vertical_ratio = vertical_ratio

														
@@ -78,9 +82,12 @@ class JDETracker(object):
 
															         self.tracked_thresh = tracked_thresh

														
 
															         self.r_tracked_thresh = r_tracked_thresh

														
 
															         self.unconfirmed_thresh = unconfirmed_thresh

														
 
															+        self.conf_thres = conf_thres

														
 
															+        self.match_thres = match_thres

														
 
															+        self.low_conf_thres = low_conf_thres

														
 
															+

														
 
															         if motion == 'KalmanFilter':

														
 
															             self.motion = KalmanFilter()

														
 
															-        self.conf_thres = conf_thres

														
 
															         self.metric_type = metric_type

														
 
															         self.frame_id = 0

														
@@ -91,7 +98,7 @@ class JDETracker(object):
 
															         self.max_time_lost = 0

														
 
															         # max_time_lost will be calculated: int(frame_rate / 30.0 * track_buffer)

														
 
															-    def update(self, pred_dets, pred_embs):

														
 
															+    def update(self, pred_dets, pred_embs=None):

														
 
															         """

														
 
															         Processes the image frame and finds bounding box(detections).

														
 
															         Associates the detection with corresponding tracklets and also handles

														
@@ -123,7 +130,10 @@ class JDETracker(object):
 
															         for cls_id in range(self.num_classes):

														
 
															             cls_idx = (pred_dets[:, 5:] == cls_id).squeeze(-1)

														
 
															             pred_dets_dict[cls_id] = pred_dets[cls_idx]

														
 
															-            pred_embs_dict[cls_id] = pred_embs[cls_idx]

														
 
															+            if pred_embs is not None:

														
 
															+                pred_embs_dict[cls_id] = pred_embs[cls_idx]

														
 
															+            else:

														
 
															+                pred_embs_dict[cls_id] = None

														
 
															         for cls_id in range(self.num_classes):

														
 
															             """ Step 1: Get detections by class"""

														
@@ -132,13 +142,24 @@ class JDETracker(object):
 
															             remain_inds = (pred_dets_cls[:, 4:5] > self.conf_thres).squeeze(-1)

														
 
															             if remain_inds.sum() > 0:

														
 
															                 pred_dets_cls = pred_dets_cls[remain_inds]

														
 
															-                pred_embs_cls = pred_embs_cls[remain_inds]

														
 
															-                detections = [

														
 
															-                    STrack(

														
 
															-                        STrack.tlbr_to_tlwh(tlbrs[:4]), tlbrs[4], f,

														
 
															-                        self.num_classes, cls_id, 30)

														
 
															-                    for (tlbrs, f) in zip(pred_dets_cls, pred_embs_cls)

														
 
															-                ]

														
 
															+                if self.use_byte:

														
 
															+                    detections = [

														
 
															+                        STrack(

														
 
															+                            STrack.tlbr_to_tlwh(tlbrs[:4]),

														
 
															+                            tlbrs[4],

														
 
															+                            cls_id,

														
 
															+                            30,

														
 
															+                            temp_feat=None) for tlbrs in pred_dets_cls

														
 
															+                    ]

														
 
															+                else:

														
 
															+                    pred_embs_cls = pred_embs_cls[remain_inds]

														
 
															+                    detections = [

														
 
															+                        STrack(

														
 
															+                            STrack.tlbr_to_tlwh(tlbrs[:4]), tlbrs[4], cls_id,

														
 
															+                            30, temp_feat)

														
 
															+                        for (tlbrs, temp_feat

														
 
															+                             ) in zip(pred_dets_cls, pred_embs_cls)

														
 
															+                    ]

														
 
															             else:

														
 
															                 detections = []

														
 
															             ''' Add newly detected tracklets to tracked_stracks'''

														
@@ -160,12 +181,20 @@ class JDETracker(object):
 
															             # Predict the current location with KalmanFilter

														
 
															             STrack.multi_predict(track_pool_dict[cls_id], self.motion)

														
 
															-            dists = matching.embedding_distance(

														
 
															-                track_pool_dict[cls_id], detections, metric=self.metric_type)

														
 
															-            dists = matching.fuse_motion(self.motion, dists,

														
 
															-                                         track_pool_dict[cls_id], detections)

														
 
															-            matches, u_track, u_detection = matching.linear_assignment(

														
 
															-                dists, thresh=self.tracked_thresh)

														
 
															+            if self.use_byte:

														
 
															+                dists = matching.iou_distance(track_pool_dict[cls_id],

														
 
															+                                              detections)

														
 
															+                matches, u_track, u_detection = matching.linear_assignment(

														
 
															+                    dists, thresh=self.match_thres)  #

														
 
															+            else:

														
 
															+                dists = matching.embedding_distance(

														
 
															+                    track_pool_dict[cls_id],

														
 
															+                    detections,

														
 
															+                    metric=self.metric_type)

														
 
															+                dists = matching.fuse_motion(

														
 
															+                    self.motion, dists, track_pool_dict[cls_id], detections)

														
 
															+                matches, u_track, u_detection = matching.linear_assignment(

														
 
															+                    dists, thresh=self.tracked_thresh)

														
 
															             for i_tracked, idet in matches:

														
 
															                 # i_tracked is the id of the track and idet is the detection

														
@@ -183,19 +212,48 @@ class JDETracker(object):
 
															             # None of the steps below happen if there are no undetected tracks.

														
 
															             """ Step 3: Second association, with IOU"""

														
 
															-            detections = [detections[i] for i in u_detection]

														
 
															-            r_tracked_stracks = []

														
 
															-            for i in u_track:

														
 
															-                if track_pool_dict[cls_id][i].state == TrackState.Tracked:

														
 
															-                    r_tracked_stracks.append(track_pool_dict[cls_id][i])

														
 
															+            if self.use_byte:

														
 
															+                inds_low = pred_dets_dict[cls_id][:, 4:5] > self.low_conf_thres

														
 
															+                inds_high = pred_dets_dict[cls_id][:, 4:5] < self.conf_thres

														
 
															+                inds_second = np.logical_and(inds_low, inds_high).squeeze(-1)

														
 
															+                pred_dets_cls_second = pred_dets_dict[cls_id][inds_second]

														
 
															-            dists = matching.iou_distance(r_tracked_stracks, detections)

														
 
															-            matches, u_track, u_detection = matching.linear_assignment(

														
 
															-                dists, thresh=self.r_tracked_thresh)

														
 
															+                # association the untrack to the low score detections

														
 
															+                if len(pred_dets_cls_second) > 0:

														
 
															+                    detections_second = [

														
 
															+                        STrack(

														
 
															+                            STrack.tlbr_to_tlwh(tlbrs[:4]),

														
 
															+                            tlbrs[4],

														
 
															+                            cls_id,

														
 
															+                            30,

														
 
															+                            temp_feat=None)

														
 
															+                        for tlbrs in pred_dets_cls_second[:, :5]

														
 
															+                    ]

														
 
															+                else:

														
 
															+                    detections_second = []

														
 
															+                r_tracked_stracks = [

														
 
															+                    track_pool_dict[cls_id][i] for i in u_track

														
 
															+                    if track_pool_dict[cls_id][i].state == TrackState.Tracked

														
 
															+                ]

														
 
															+                dists = matching.iou_distance(r_tracked_stracks,

														
 
															+                                              detections_second)

														
 
															+                matches, u_track, u_detection_second = matching.linear_assignment(

														
 
															+                    dists, thresh=0.4)  # not r_tracked_thresh

														
 
															+            else:

														
 
															+                detections = [detections[i] for i in u_detection]

														
 
															+                r_tracked_stracks = []

														
 
															+                for i in u_track:

														
 
															+                    if track_pool_dict[cls_id][i].state == TrackState.Tracked:

														
 
															+                        r_tracked_stracks.append(track_pool_dict[cls_id][i])

														
 
															+                dists = matching.iou_distance(r_tracked_stracks, detections)

														
 
															+

														
 
															+                matches, u_track, u_detection = matching.linear_assignment(

														
 
															+                    dists, thresh=self.r_tracked_thresh)

														
 
															             for i_tracked, idet in matches:

														
 
															                 track = r_tracked_stracks[i_tracked]

														
 
															-                det = detections[idet]

														
 
															+                det = detections[

														
 
															+                    idet] if not self.use_byte else detections_second[idet]

														
 
															                 if track.state == TrackState.Tracked:

														
 
															                     track.update(det, self.frame_id)

														
 
															                     activated_tracks_dict[cls_id].append(track)

														
--- a/paddlex/ppdet/modeling/necks/bifpn.py
+++ b/paddlex/ppdet/modeling/necks/bifpn.py
@@ -52,10 +52,8 @@ class SeparableConvLayer(nn.Layer):
 
															         self.pointwise_conv = nn.Conv2D(in_channels, self.out_channels, 1)
														
 
															         # norm type
														
 
															-        if self.norm_type == 'bn':
														
 
															+        if self.norm_type in ['bn', 'sync_bn']:
														
 
															             self.norm = nn.BatchNorm2D(self.out_channels)
														
 
															-        elif self.norm_type == 'sync_bn':
														
 
															-            self.norm = nn.SyncBatchNorm(self.out_channels)
														
 
															         elif self.norm_type == 'gn':
														
 
															             self.norm = nn.GroupNorm(
														
 
															                 num_groups=self.norm_groups, num_channels=self.out_channels)
														
--- a/paddlex/ppdet/modeling/necks/blazeface_fpn.py
+++ b/paddlex/ppdet/modeling/necks/blazeface_fpn.py
@@ -54,11 +54,8 @@ class ConvBNLayer(nn.Layer):
 
															                 learning_rate=conv_lr, initializer=KaimingNormal()),
														
 
															             bias_attr=False)
														
 
															-        if norm_type == 'sync_bn':
														
 
															-            self._batch_norm = nn.SyncBatchNorm(out_channels)
														
 
															-        else:
														
 
															-            self._batch_norm = nn.BatchNorm(
														
 
															-                out_channels, act=None, use_global_stats=False)
														
 
															+        if norm_type in ['sync_bn', 'bn']:
														
 
															+            self._batch_norm = nn.BatchNorm2D(out_channels)
														
 
															     def forward(self, x):
														
 
															         x = self._conv(x)
														
--- a/paddlex/ppdet/modeling/necks/pan.py
+++ b/paddlex/ppdet/modeling/necks/pan.py
@@ -1,135 +0,0 @@
 
															-# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-import numpy as np
														
 
															-import paddle
														
 
															-import paddle.nn as nn
														
 
															-import paddle.nn.functional as F
														
 
															-from paddle import ParamAttr
														
 
															-from paddle.nn.initializer import XavierUniform
														
 
															-from paddle.regularizer import L2Decay
														
 
															-from paddlex.ppdet.core.workspace import register, serializable
														
 
															-from paddlex.ppdet.modeling.layers import ConvNormLayer
														
 
															-from ..shape_spec import ShapeSpec
														
 
															-
														
 
															-__all__ = ['PAN']
														
 
															-
														
 
															-
														
 
															-@register
														
 
															-@serializable
														
 
															-class PAN(nn.Layer):
														
 
															-    """
														
 
															-    Path Aggregation Network, see https://arxiv.org/abs/1803.01534
														
 
															-
														
 
															-    Args:
														
 
															-        in_channels (list[int]): input channels of each level which can be
														
 
															-            derived from the output shape of backbone by from_config
														
 
															-        out_channel (list[int]): output channel of each level
														
 
															-        spatial_scales (list[float]): the spatial scales between input feature
														
 
															-            maps and original input image which can be derived from the output
														
 
															-            shape of backbone by from_config
														
 
															-        has_extra_convs (bool): whether to add extra conv to the last level.
														
 
															-            default False
														
 
															-        extra_stage (int): the number of extra stages added to the last level.
														
 
															-            default 1
														
 
															-        use_c5 (bool): Whether to use c5 as the input of extra stage,
														
 
															-            otherwise p5 is used. default True
														
 
															-        norm_type (string|None): The normalization type in FPN module. If
														
 
															-            norm_type is None, norm will not be used after conv and if
														
 
															-            norm_type is string, bn, gn, sync_bn are available. default None
														
 
															-        norm_decay (float): weight decay for normalization layer weights.
														
 
															-            default 0.
														
 
															-        freeze_norm (bool): whether to freeze normalization layer.
														
 
															-            default False
														
 
															-        relu_before_extra_convs (bool): whether to add relu before extra convs.
														
 
															-            default False
														
 
															-    """
														
 
															-
														
 
															-    def __init__(self,
														
 
															-                 in_channels,
														
 
															-                 out_channel,
														
 
															-                 spatial_scales=[0.125, 0.0625, 0.03125],
														
 
															-                 start_level=0,
														
 
															-                 end_level=-1,
														
 
															-                 norm_type=None):
														
 
															-        super(PAN, self).__init__()
														
 
															-        self.out_channel = out_channel
														
 
															-        self.num_ins = len(in_channels)
														
 
															-        self.spatial_scales = spatial_scales
														
 
															-        if end_level == -1:
														
 
															-            self.end_level = self.num_ins
														
 
															-        else:
														
 
															-            # if end_level < inputs, no extra level is allowed
														
 
															-            self.end_level = end_level
														
 
															-            assert end_level <= len(in_channels)
														
 
															-        self.start_level = start_level
														
 
															-        self.norm_type = norm_type
														
 
															-        self.lateral_convs = []
														
 
															-
														
 
															-        for i in range(self.start_level, self.end_level):
														
 
															-            in_c = in_channels[i - self.start_level]
														
 
															-            if self.norm_type is not None:
														
 
															-                lateral = self.add_sublayer(
														
 
															-                    'pan_lateral' + str(i),
														
 
															-                    ConvNormLayer(
														
 
															-                        ch_in=in_c,
														
 
															-                        ch_out=self.out_channel,
														
 
															-                        filter_size=1,
														
 
															-                        stride=1,
														
 
															-                        norm_type=self.norm_type,
														
 
															-                        norm_decay=self.norm_decay,
														
 
															-                        freeze_norm=self.freeze_norm,
														
 
															-                        initializer=XavierUniform(fan_out=in_c)))
														
 
															-            else:
														
 
															-                lateral = self.add_sublayer(
														
 
															-                    'pan_lateral' + str(i),
														
 
															-                    nn.Conv2D(
														
 
															-                        in_channels=in_c,
														
 
															-                        out_channels=self.out_channel,
														
 
															-                        kernel_size=1,
														
 
															-                        weight_attr=ParamAttr(
														
 
															-                            initializer=XavierUniform(fan_out=in_c))))
														
 
															-            self.lateral_convs.append(lateral)
														
 
															-
														
 
															-    @classmethod
														
 
															-    def from_config(cls, cfg, input_shape):
														
 
															-        return {'in_channels': [i.channels for i in input_shape], }
														
 
															-
														
 
															-    def forward(self, body_feats):
														
 
															-        laterals = []
														
 
															-        for i, lateral_conv in enumerate(self.lateral_convs):
														
 
															-            laterals.append(lateral_conv(body_feats[i + self.start_level]))
														
 
															-        num_levels = len(laterals)
														
 
															-        for i in range(1, num_levels):
														
 
															-            lvl = num_levels - i
														
 
															-            upsample = F.interpolate(
														
 
															-                laterals[lvl],
														
 
															-                scale_factor=2.,
														
 
															-                mode='bilinear', )
														
 
															-            laterals[lvl - 1] += upsample
														
 
															-
														
 
															-        outs = [laterals[i] for i in range(num_levels)]
														
 
															-        for i in range(0, num_levels - 1):
														
 
															-            outs[i + 1] += F.interpolate(
														
 
															-                outs[i], scale_factor=0.5, mode='bilinear')
														
 
															-
														
 
															-        return outs
														
 
															-
														
 
															-    @property
														
 
															-    def out_shape(self):
														
 
															-        return [
														
 
															-            ShapeSpec(
														
 
															-                channels=self.out_channel, stride=1. / s)
														
 
															-            for s in self.spatial_scales
														
 
															-        ]
														
--- a/paddlex/ppdet/modeling/ops.py
+++ b/paddlex/ppdet/modeling/ops.py
@@ -50,10 +50,6 @@ def batch_norm(ch,
 
															                freeze_norm=False,
														
 
															                initializer=None,
														
 
															                data_format='NCHW'):
														
 
															-    if norm_type == 'sync_bn':
														
 
															-        batch_norm = nn.SyncBatchNorm
														
 
															-    else:
														
 
															-        batch_norm = nn.BatchNorm2D
														
 
															     norm_lr = 0. if freeze_norm else 1.
														
 
															     weight_attr = ParamAttr(
														
@@ -66,11 +62,12 @@ def batch_norm(ch,
 
															         regularizer=L2Decay(norm_decay),
														
 
															         trainable=False if freeze_norm else True)
														
 
															-    norm_layer = batch_norm(
														
 
															-        ch,
														
 
															-        weight_attr=weight_attr,
														
 
															-        bias_attr=bias_attr,
														
 
															-        data_format=data_format)
														
 
															+    if norm_type in ['sync_bn', 'bn']:
														
 
															+        norm_layer = nn.BatchNorm2D(
														
 
															+            ch,
														
 
															+            weight_attr=weight_attr,
														
 
															+            bias_attr=bias_attr,
														
 
															+            data_format=data_format)
														
 
															     norm_params = norm_layer.parameters()
														
 
															     if freeze_norm:
														
--- a/paddlex/ppdet/modeling/post_process.py
+++ b/paddlex/ppdet/modeling/post_process.py
@@ -42,10 +42,6 @@ class BBoxPostProcess(nn.Layer):
 
															         self.num_classes = num_classes
														
 
															         self.decode = decode
														
 
															         self.nms = nms
														
 
															-        self.fake_bboxes = paddle.to_tensor(
														
 
															-            np.array(
														
 
															-                [[-1, 0.0, 0.0, 0.0, 0.0, 0.0]], dtype='float32'))
														
 
															-        self.fake_bbox_num = paddle.to_tensor(np.array([1], dtype='int32'))
														
 
															     def forward(self, head_out, rois, im_shape, scale_factor):
														
 
															         """
														
@@ -91,9 +87,28 @@ class BBoxPostProcess(nn.Layer):
 
															                 including labels, scores and bboxes.
														
 
															         """
														
 
															-        if bboxes.shape[0] == 0:
														
 
															-            bboxes = self.fake_bboxes
														
 
															-            bbox_num = self.fake_bbox_num
														
 
															+        bboxes_list = []
														
 
															+        bbox_num_list = []
														
 
															+        id_start = 0
														
 
															+        fake_bboxes = paddle.to_tensor(
														
 
															+            np.array(
														
 
															+                [[-1, 0.0, 0.0, 0.0, 0.0, 0.0]], dtype='float32'))
														
 
															+        fake_bbox_num = paddle.to_tensor(np.array([1], dtype='int32'))
														
 
															+
														
 
															+        # add fake bbox when output is empty for each batch
														
 
															+        for i in range(bbox_num.shape[0]):
														
 
															+            if bbox_num[i] == 0:
														
 
															+                bboxes_i = fake_bboxes
														
 
															+                bbox_num_i = fake_bbox_num
														
 
															+                id_start += 1
														
 
															+            else:
														
 
															+                bboxes_i = bboxes[id_start:id_start + bbox_num[i], :]
														
 
															+                bbox_num_i = bbox_num[i]
														
 
															+                id_start += bbox_num[i]
														
 
															+            bboxes_list.append(bboxes_i)
														
 
															+            bbox_num_list.append(bbox_num_i)
														
 
															+        bboxes = paddle.concat(bboxes_list)
														
 
															+        bbox_num = paddle.concat(bbox_num_list)
														
 
															         origin_shape = paddle.floor(im_shape / scale_factor + 0.5)
														
@@ -157,6 +172,7 @@ class MaskPostProcess(object):
 
															         """
														
 
															         Paste the mask prediction to the original image.
														
 
															         """
														
 
															+
														
 
															         x0, y0, x1, y1 = paddle.split(boxes, 4, axis=1)
														
 
															         masks = paddle.unsqueeze(masks, [0, 1])
														
 
															         img_y = paddle.arange(0, im_h, dtype='float32') + 0.5
														
--- a/paddlex/ppdet/modeling/proposal_generator/target.py
+++ b/paddlex/ppdet/modeling/proposal_generator/target.py
@@ -52,8 +52,8 @@ def rpn_anchor_target(anchors,
 
															             labels = paddle.scatter(labels, fg_inds, paddle.ones_like(fg_inds))
														
 
															         # Step3: make output
														
 
															         if gt_bbox.shape[0] == 0:
														
 
															-            matched_gt_boxes = paddle.zeros([0, 4])
														
 
															-            tgt_delta = paddle.zeros([0, 4])
														
 
															+            matched_gt_boxes = paddle.zeros([matches.shape[0], 4])
														
 
															+            tgt_delta = paddle.zeros([matches.shape[0], 4])
														
 
															         else:
														
 
															             matched_gt_boxes = paddle.gather(gt_bbox, matches)
														
 
															             tgt_delta = bbox2delta(anchors, matched_gt_boxes, weights)
														
--- a/paddlex/ppdet/modeling/reid/pplcnet_embedding.py
+++ b/paddlex/ppdet/modeling/reid/pplcnet_embedding.py
@@ -21,7 +21,7 @@ import paddle.nn as nn
 
															 import paddle.nn.functional as F
														
 
															 from paddle.nn.initializer import Normal, Constant
														
 
															 from paddle import ParamAttr
														
 
															-from paddle.nn import AdaptiveAvgPool2D, BatchNorm, Conv2D, Linear
														
 
															+from paddle.nn import AdaptiveAvgPool2D, BatchNorm2D, Conv2D, Linear
														
 
															 from paddle.regularizer import L2Decay
														
 
															 from paddle.nn.initializer import KaimingNormal, XavierNormal
														
 
															 from paddlex.ppdet.core.workspace import register
														
@@ -76,9 +76,9 @@ class ConvBNLayer(nn.Layer):
 
															             weight_attr=ParamAttr(initializer=KaimingNormal()),
														
 
															             bias_attr=False)
														
 
															-        self.bn = BatchNorm(
														
 
															+        self.bn = BatchNorm2D(
														
 
															             num_filters,
														
 
															-            param_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															+            weight_attr=ParamAttr(regularizer=L2Decay(0.0)),
														
 
															             bias_attr=ParamAttr(regularizer=L2Decay(0.0)))
														
 
															         self.hardswish = nn.Hardswish()
														
--- a/paddlex/ppdet/modeling/reid/resnet.py
+++ b/paddlex/ppdet/modeling/reid/resnet.py
@@ -55,12 +55,14 @@ class ConvBNLayer(nn.Layer):
 
															             bias_attr=False,
														
 
															             data_format=data_format)
														
 
															-        self._batch_norm = nn.BatchNorm(
														
 
															-            num_filters, act=act, data_layout=data_format)
														
 
															+        self._batch_norm = nn.BatchNorm2D(num_filters, data_layout=data_format)
														
 
															+        self.act = act
														
 
															     def forward(self, inputs):
														
 
															         y = self._conv(inputs)
														
 
															         y = self._batch_norm(y)
														
 
															+        if self.act:
														
 
															+            y = getattr(F, self.act)(y)
														
 
															         return y
														
--- a/paddlex/ppdet/modeling/tests/__init__.py
+++ b/paddlex/ppdet/modeling/tests/__init__.py
@@ -1,13 +0,0 @@
 
															-#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
--- a/paddlex/ppdet/modeling/tests/imgs/coco2017_val2017_000000000139.jpg
+++ b/paddlex/ppdet/modeling/tests/imgs/coco2017_val2017_000000000139.jpg
--- a/paddlex/ppdet/modeling/tests/imgs/coco2017_val2017_000000000724.jpg
+++ b/paddlex/ppdet/modeling/tests/imgs/coco2017_val2017_000000000724.jpg
--- a/paddlex/ppdet/modeling/tests/test_architectures.py
+++ b/paddlex/ppdet/modeling/tests/test_architectures.py
@@ -1,69 +0,0 @@
 
															-#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import absolute_import
														
 
															-from __future__ import division
														
 
															-from __future__ import print_function
														
 
															-
														
 
															-import unittest
														
 
															-import paddlex.ppdet
														
 
															-
														
 
															-
														
 
															-class TestFasterRCNN(unittest.TestCase):
														
 
															-    def setUp(self):
														
 
															-        self.set_config()
														
 
															-
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/faster_rcnn/faster_rcnn_r50_fpn_1x_coco.yml'
														
 
															-
														
 
															-    def test_trainer(self):
														
 
															-        # Trainer __init__ will build model and DataLoader
														
 
															-        # 'train' and 'eval' mode include dataset loading
														
 
															-        # use 'test' mode to simplify tests
														
 
															-        cfg = ppdet.core.workspace.load_config(self.cfg_file)
														
 
															-        trainer = ppdet.engine.Trainer(cfg, mode='test')
														
 
															-
														
 
															-
														
 
															-class TestMaskRCNN(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/mask_rcnn/mask_rcnn_r50_fpn_1x_coco.yml'
														
 
															-
														
 
															-
														
 
															-class TestCascadeRCNN(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/cascade_rcnn/cascade_rcnn_r50_fpn_1x_coco.yml'
														
 
															-
														
 
															-
														
 
															-class TestYolov3(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/yolov3/yolov3_darknet53_270e_coco.yml'
														
 
															-
														
 
															-
														
 
															-class TestSSD(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/ssd/ssd_vgg16_300_240e_voc.yml'
														
 
															-
														
 
															-
														
 
															-class TestGFL(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/gfl/gfl_r50_fpn_1x_coco.yml'
														
 
															-
														
 
															-
														
 
															-class TestPicoDet(TestFasterRCNN):
														
 
															-    def set_config(self):
														
 
															-        self.cfg_file = 'configs/picodet/picodet_s_320_coco.yml'
														
 
															-
														
 
															-
														
 
															-if __name__ == '__main__':
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/modeling/tests/test_base.py
+++ b/paddlex/ppdet/modeling/tests/test_base.py
@@ -1,74 +0,0 @@
 
															-#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import print_function
														
 
															-import unittest
														
 
															-
														
 
															-import contextlib
														
 
															-
														
 
															-import paddle
														
 
															-import paddle.fluid as fluid
														
 
															-from paddle.fluid.framework import Program
														
 
															-from paddle.fluid import core
														
 
															-
														
 
															-
														
 
															-class LayerTest(unittest.TestCase):
														
 
															-    @classmethod
														
 
															-    def setUpClass(cls):
														
 
															-        cls.seed = 111
														
 
															-
														
 
															-    @classmethod
														
 
															-    def tearDownClass(cls):
														
 
															-        pass
														
 
															-
														
 
															-    def _get_place(self, force_to_use_cpu=False):
														
 
															-        # this option for ops that only have cpu kernel
														
 
															-        if force_to_use_cpu:
														
 
															-            return core.CPUPlace()
														
 
															-        else:
														
 
															-            if core.is_compiled_with_cuda():
														
 
															-                return core.CUDAPlace(0)
														
 
															-            return core.CPUPlace()
														
 
															-
														
 
															-    @contextlib.contextmanager
														
 
															-    def static_graph(self):
														
 
															-        paddle.enable_static()
														
 
															-        scope = fluid.core.Scope()
														
 
															-        program = Program()
														
 
															-        with fluid.scope_guard(scope):
														
 
															-            with fluid.program_guard(program):
														
 
															-                paddle.seed(self.seed)
														
 
															-                paddle.framework.random._manual_program_seed(self.seed)
														
 
															-                yield
														
 
															-
														
 
															-    def get_static_graph_result(self,
														
 
															-                                feed,
														
 
															-                                fetch_list,
														
 
															-                                with_lod=False,
														
 
															-                                force_to_use_cpu=False):
														
 
															-        exe = fluid.Executor(self._get_place(force_to_use_cpu))
														
 
															-        exe.run(fluid.default_startup_program())
														
 
															-        return exe.run(fluid.default_main_program(),
														
 
															-                       feed=feed,
														
 
															-                       fetch_list=fetch_list,
														
 
															-                       return_numpy=(not with_lod))
														
 
															-
														
 
															-    @contextlib.contextmanager
														
 
															-    def dynamic_graph(self, force_to_use_cpu=False):
														
 
															-        paddle.disable_static()
														
 
															-        with fluid.dygraph.guard(
														
 
															-                self._get_place(force_to_use_cpu=force_to_use_cpu)):
														
 
															-            paddle.seed(self.seed)
														
 
															-            paddle.framework.random._manual_program_seed(self.seed)
														
 
															-            yield
														
--- a/paddlex/ppdet/modeling/tests/test_mstest.py
+++ b/paddlex/ppdet/modeling/tests/test_mstest.py
@@ -1,62 +0,0 @@
 
															-#   Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import absolute_import
														
 
															-from __future__ import division
														
 
															-from __future__ import print_function
														
 
															-
														
 
															-import os
														
 
															-import unittest
														
 
															-from paddlex.ppdet.core.workspace import load_config
														
 
															-from paddlex.ppdet.engine import Trainer
														
 
															-
														
 
															-
														
 
															-class TestMultiScaleInference(unittest.TestCase):
														
 
															-    def setUp(self):
														
 
															-        self.set_config()
														
 
															-
														
 
															-    def set_config(self):
														
 
															-        self.mstest_cfg_file = 'configs/faster_rcnn/faster_rcnn_r34_fpn_multiscaletest_1x_coco.yml'
														
 
															-
														
 
															-    # test evaluation with multi scale test
														
 
															-    def test_eval_mstest(self):
														
 
															-        cfg = load_config(self.mstest_cfg_file)
														
 
															-        trainer = Trainer(cfg, mode='eval')
														
 
															-
														
 
															-        cfg.weights = 'https://paddledet.bj.bcebos.com/models/faster_rcnn_r34_fpn_1x_coco.pdparams'
														
 
															-        trainer.load_weights(cfg.weights)
														
 
															-
														
 
															-        trainer.evaluate()
														
 
															-
														
 
															-    # test inference with multi scale test
														
 
															-    def test_infer_mstest(self):
														
 
															-        cfg = load_config(self.mstest_cfg_file)
														
 
															-        trainer = Trainer(cfg, mode='test')
														
 
															-
														
 
															-        cfg.weights = 'https://paddledet.bj.bcebos.com/models/faster_rcnn_r34_fpn_1x_coco.pdparams'
														
 
															-        trainer.load_weights(cfg.weights)
														
 
															-        tests_img_root = os.path.join(os.path.dirname(__file__), 'imgs')
														
 
															-
														
 
															-        # input images to predict
														
 
															-        imgs = [
														
 
															-            'coco2017_val2017_000000000139.jpg',
														
 
															-            'coco2017_val2017_000000000724.jpg'
														
 
															-        ]
														
 
															-        imgs = [os.path.join(tests_img_root, img) for img in imgs]
														
 
															-        trainer.predict(
														
 
															-            imgs, draw_threshold=0.5, output_dir='output', save_txt=True)
														
 
															-
														
 
															-
														
 
															-if __name__ == '__main__':
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/modeling/tests/test_ops.py
+++ b/paddlex/ppdet/modeling/tests/test_ops.py
@@ -1,838 +0,0 @@
 
															-#   Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import print_function
														
 
															-import os, sys
														
 
															-# add python path of PadleDetection to sys.path
														
 
															-parent_path = os.path.abspath(os.path.join(__file__, *(['..'] * 4)))
														
 
															-if parent_path not in sys.path:
														
 
															-    sys.path.append(parent_path)
														
 
															-
														
 
															-import unittest
														
 
															-import numpy as np
														
 
															-
														
 
															-import paddle
														
 
															-import paddle.fluid as fluid
														
 
															-from paddle.fluid.dygraph import base
														
 
															-
														
 
															-import paddlex.ppdet.modeling.ops as ops
														
 
															-from paddlex.ppdet.modeling.tests.test_base import LayerTest
														
 
															-
														
 
															-
														
 
															-def make_rois(h, w, rois_num, output_size):
														
 
															-    rois = np.zeros((0, 4)).astype('float32')
														
 
															-    for roi_num in rois_num:
														
 
															-        roi = np.zeros((roi_num, 4)).astype('float32')
														
 
															-        roi[:, 0] = np.random.randint(0, h - output_size[0], size=roi_num)
														
 
															-        roi[:, 1] = np.random.randint(0, w - output_size[1], size=roi_num)
														
 
															-        roi[:, 2] = np.random.randint(roi[:, 0] + output_size[0], h)
														
 
															-        roi[:, 3] = np.random.randint(roi[:, 1] + output_size[1], w)
														
 
															-        rois = np.vstack((rois, roi))
														
 
															-    return rois
														
 
															-
														
 
															-
														
 
															-def softmax(x):
														
 
															-    # clip to shiftx, otherwise, when calc loss with
														
 
															-    # log(exp(shiftx)), may get log(0)=INF
														
 
															-    shiftx = (x - np.max(x)).clip(-64.)
														
 
															-    exps = np.exp(shiftx)
														
 
															-    return exps / np.sum(exps)
														
 
															-
														
 
															-
														
 
															-class TestCollectFpnProposals(LayerTest):
														
 
															-    def test_collect_fpn_proposals(self):
														
 
															-        multi_bboxes_np = []
														
 
															-        multi_scores_np = []
														
 
															-        rois_num_per_level_np = []
														
 
															-        for i in range(4):
														
 
															-            bboxes_np = np.random.rand(5, 4).astype('float32')
														
 
															-            scores_np = np.random.rand(5, 1).astype('float32')
														
 
															-            rois_num = np.array([2, 3]).astype('int32')
														
 
															-            multi_bboxes_np.append(bboxes_np)
														
 
															-            multi_scores_np.append(scores_np)
														
 
															-            rois_num_per_level_np.append(rois_num)
														
 
															-
														
 
															-        with self.static_graph():
														
 
															-            multi_bboxes = []
														
 
															-            multi_scores = []
														
 
															-            rois_num_per_level = []
														
 
															-            for i in range(4):
														
 
															-                bboxes = paddle.static.data(
														
 
															-                    name='rois' + str(i),
														
 
															-                    shape=[5, 4],
														
 
															-                    dtype='float32',
														
 
															-                    lod_level=1)
														
 
															-                scores = paddle.static.data(
														
 
															-                    name='scores' + str(i),
														
 
															-                    shape=[5, 1],
														
 
															-                    dtype='float32',
														
 
															-                    lod_level=1)
														
 
															-                rois_num = paddle.static.data(
														
 
															-                    name='rois_num' + str(i), shape=[None], dtype='int32')
														
 
															-
														
 
															-                multi_bboxes.append(bboxes)
														
 
															-                multi_scores.append(scores)
														
 
															-                rois_num_per_level.append(rois_num)
														
 
															-
														
 
															-            fpn_rois, rois_num = ops.collect_fpn_proposals(
														
 
															-                multi_bboxes,
														
 
															-                multi_scores,
														
 
															-                2,
														
 
															-                5,
														
 
															-                10,
														
 
															-                rois_num_per_level=rois_num_per_level)
														
 
															-            feed = {}
														
 
															-            for i in range(4):
														
 
															-                feed['rois' + str(i)] = multi_bboxes_np[i]
														
 
															-                feed['scores' + str(i)] = multi_scores_np[i]
														
 
															-                feed['rois_num' + str(i)] = rois_num_per_level_np[i]
														
 
															-            fpn_rois_stat, rois_num_stat = self.get_static_graph_result(
														
 
															-                feed=feed, fetch_list=[fpn_rois, rois_num], with_lod=True)
														
 
															-            fpn_rois_stat = np.array(fpn_rois_stat)
														
 
															-            rois_num_stat = np.array(rois_num_stat)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            multi_bboxes_dy = []
														
 
															-            multi_scores_dy = []
														
 
															-            rois_num_per_level_dy = []
														
 
															-            for i in range(4):
														
 
															-                bboxes_dy = base.to_variable(multi_bboxes_np[i])
														
 
															-                scores_dy = base.to_variable(multi_scores_np[i])
														
 
															-                rois_num_dy = base.to_variable(rois_num_per_level_np[i])
														
 
															-                multi_bboxes_dy.append(bboxes_dy)
														
 
															-                multi_scores_dy.append(scores_dy)
														
 
															-                rois_num_per_level_dy.append(rois_num_dy)
														
 
															-            fpn_rois_dy, rois_num_dy = ops.collect_fpn_proposals(
														
 
															-                multi_bboxes_dy,
														
 
															-                multi_scores_dy,
														
 
															-                2,
														
 
															-                5,
														
 
															-                10,
														
 
															-                rois_num_per_level=rois_num_per_level_dy)
														
 
															-            fpn_rois_dy = fpn_rois_dy.numpy()
														
 
															-            rois_num_dy = rois_num_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(fpn_rois_stat, fpn_rois_dy))
														
 
															-        self.assertTrue(np.array_equal(rois_num_stat, rois_num_dy))
														
 
															-
														
 
															-    def test_collect_fpn_proposals_error(self):
														
 
															-        def generate_input(bbox_type, score_type, name):
														
 
															-            multi_bboxes = []
														
 
															-            multi_scores = []
														
 
															-            for i in range(4):
														
 
															-                bboxes = paddle.static.data(
														
 
															-                    name='rois' + name + str(i),
														
 
															-                    shape=[10, 4],
														
 
															-                    dtype=bbox_type,
														
 
															-                    lod_level=1)
														
 
															-                scores = paddle.static.data(
														
 
															-                    name='scores' + name + str(i),
														
 
															-                    shape=[10, 1],
														
 
															-                    dtype=score_type,
														
 
															-                    lod_level=1)
														
 
															-                multi_bboxes.append(bboxes)
														
 
															-                multi_scores.append(scores)
														
 
															-            return multi_bboxes, multi_scores
														
 
															-
														
 
															-        with self.static_graph():
														
 
															-            bbox1 = paddle.static.data(
														
 
															-                name='rois', shape=[5, 10, 4], dtype='float32', lod_level=1)
														
 
															-            score1 = paddle.static.data(
														
 
															-                name='scores', shape=[5, 10, 1], dtype='float32', lod_level=1)
														
 
															-            bbox2, score2 = generate_input('int32', 'float32', '2')
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.collect_fpn_proposals,
														
 
															-                multi_rois=bbox1,
														
 
															-                multi_scores=score1,
														
 
															-                min_level=2,
														
 
															-                max_level=5,
														
 
															-                post_nms_top_n=2000)
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.collect_fpn_proposals,
														
 
															-                multi_rois=bbox2,
														
 
															-                multi_scores=score2,
														
 
															-                min_level=2,
														
 
															-                max_level=5,
														
 
															-                post_nms_top_n=2000)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestDistributeFpnProposals(LayerTest):
														
 
															-    def test_distribute_fpn_proposals(self):
														
 
															-        rois_np = np.random.rand(10, 4).astype('float32')
														
 
															-        rois_num_np = np.array([4, 6]).astype('int32')
														
 
															-        with self.static_graph():
														
 
															-            rois = paddle.static.data(
														
 
															-                name='rois', shape=[10, 4], dtype='float32')
														
 
															-            rois_num = paddle.static.data(
														
 
															-                name='rois_num', shape=[None], dtype='int32')
														
 
															-            multi_rois, restore_ind, rois_num_per_level = ops.distribute_fpn_proposals(
														
 
															-                fpn_rois=rois,
														
 
															-                min_level=2,
														
 
															-                max_level=5,
														
 
															-                refer_level=4,
														
 
															-                refer_scale=224,
														
 
															-                rois_num=rois_num)
														
 
															-            fetch_list = multi_rois + [restore_ind] + rois_num_per_level
														
 
															-            output_stat = self.get_static_graph_result(
														
 
															-                feed={'rois': rois_np,
														
 
															-                      'rois_num': rois_num_np},
														
 
															-                fetch_list=fetch_list,
														
 
															-                with_lod=True)
														
 
															-            output_stat_np = []
														
 
															-            for output in output_stat:
														
 
															-                output_np = np.array(output)
														
 
															-                if len(output_np) > 0:
														
 
															-                    output_stat_np.append(output_np)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            rois_dy = base.to_variable(rois_np)
														
 
															-            rois_num_dy = base.to_variable(rois_num_np)
														
 
															-            multi_rois_dy, restore_ind_dy, rois_num_per_level_dy = ops.distribute_fpn_proposals(
														
 
															-                fpn_rois=rois_dy,
														
 
															-                min_level=2,
														
 
															-                max_level=5,
														
 
															-                refer_level=4,
														
 
															-                refer_scale=224,
														
 
															-                rois_num=rois_num_dy)
														
 
															-            output_dy = multi_rois_dy + [restore_ind_dy
														
 
															-                                         ] + rois_num_per_level_dy
														
 
															-            output_dy_np = []
														
 
															-            for output in output_dy:
														
 
															-                output_np = output.numpy()
														
 
															-                if len(output_np) > 0:
														
 
															-                    output_dy_np.append(output_np)
														
 
															-
														
 
															-        for res_stat, res_dy in zip(output_stat_np, output_dy_np):
														
 
															-            self.assertTrue(np.array_equal(res_stat, res_dy))
														
 
															-
														
 
															-    def test_distribute_fpn_proposals_error(self):
														
 
															-        with self.static_graph():
														
 
															-            fpn_rois = paddle.static.data(
														
 
															-                name='data_error', shape=[10, 4], dtype='int32', lod_level=1)
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.distribute_fpn_proposals,
														
 
															-                fpn_rois=fpn_rois,
														
 
															-                min_level=2,
														
 
															-                max_level=5,
														
 
															-                refer_level=4,
														
 
															-                refer_scale=224)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestROIAlign(LayerTest):
														
 
															-    def test_roi_align(self):
														
 
															-        b, c, h, w = 2, 12, 20, 20
														
 
															-        inputs_np = np.random.rand(b, c, h, w).astype('float32')
														
 
															-        rois_num = [4, 6]
														
 
															-        output_size = (7, 7)
														
 
															-        rois_np = make_rois(h, w, rois_num, output_size)
														
 
															-        rois_num_np = np.array(rois_num).astype('int32')
														
 
															-        with self.static_graph():
														
 
															-            inputs = paddle.static.data(
														
 
															-                name='inputs', shape=[b, c, h, w], dtype='float32')
														
 
															-            rois = paddle.static.data(
														
 
															-                name='rois', shape=[10, 4], dtype='float32')
														
 
															-            rois_num = paddle.static.data(
														
 
															-                name='rois_num', shape=[None], dtype='int32')
														
 
															-
														
 
															-            output = ops.roi_align(
														
 
															-                input=inputs,
														
 
															-                rois=rois,
														
 
															-                output_size=output_size,
														
 
															-                rois_num=rois_num)
														
 
															-            output_np, = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'inputs': inputs_np,
														
 
															-                    'rois': rois_np,
														
 
															-                    'rois_num': rois_num_np
														
 
															-                },
														
 
															-                fetch_list=output,
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            inputs_dy = base.to_variable(inputs_np)
														
 
															-            rois_dy = base.to_variable(rois_np)
														
 
															-            rois_num_dy = base.to_variable(rois_num_np)
														
 
															-
														
 
															-            output_dy = ops.roi_align(
														
 
															-                input=inputs_dy,
														
 
															-                rois=rois_dy,
														
 
															-                output_size=output_size,
														
 
															-                rois_num=rois_num_dy)
														
 
															-            output_dy_np = output_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(output_np, output_dy_np))
														
 
															-
														
 
															-    def test_roi_align_error(self):
														
 
															-        with self.static_graph():
														
 
															-            inputs = paddle.static.data(
														
 
															-                name='inputs', shape=[2, 12, 20, 20], dtype='float32')
														
 
															-            rois = paddle.static.data(
														
 
															-                name='data_error', shape=[10, 4], dtype='int32', lod_level=1)
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.roi_align,
														
 
															-                input=inputs,
														
 
															-                rois=rois,
														
 
															-                output_size=(7, 7))
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestROIPool(LayerTest):
														
 
															-    def test_roi_pool(self):
														
 
															-        b, c, h, w = 2, 12, 20, 20
														
 
															-        inputs_np = np.random.rand(b, c, h, w).astype('float32')
														
 
															-        rois_num = [4, 6]
														
 
															-        output_size = (7, 7)
														
 
															-        rois_np = make_rois(h, w, rois_num, output_size)
														
 
															-        rois_num_np = np.array(rois_num).astype('int32')
														
 
															-        with self.static_graph():
														
 
															-            inputs = paddle.static.data(
														
 
															-                name='inputs', shape=[b, c, h, w], dtype='float32')
														
 
															-            rois = paddle.static.data(
														
 
															-                name='rois', shape=[10, 4], dtype='float32')
														
 
															-            rois_num = paddle.static.data(
														
 
															-                name='rois_num', shape=[None], dtype='int32')
														
 
															-
														
 
															-            output, _ = ops.roi_pool(
														
 
															-                input=inputs,
														
 
															-                rois=rois,
														
 
															-                output_size=output_size,
														
 
															-                rois_num=rois_num)
														
 
															-            output_np, = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'inputs': inputs_np,
														
 
															-                    'rois': rois_np,
														
 
															-                    'rois_num': rois_num_np
														
 
															-                },
														
 
															-                fetch_list=[output],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            inputs_dy = base.to_variable(inputs_np)
														
 
															-            rois_dy = base.to_variable(rois_np)
														
 
															-            rois_num_dy = base.to_variable(rois_num_np)
														
 
															-
														
 
															-            output_dy, _ = ops.roi_pool(
														
 
															-                input=inputs_dy,
														
 
															-                rois=rois_dy,
														
 
															-                output_size=output_size,
														
 
															-                rois_num=rois_num_dy)
														
 
															-            output_dy_np = output_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(output_np, output_dy_np))
														
 
															-
														
 
															-    def test_roi_pool_error(self):
														
 
															-        with self.static_graph():
														
 
															-            inputs = paddle.static.data(
														
 
															-                name='inputs', shape=[2, 12, 20, 20], dtype='float32')
														
 
															-            rois = paddle.static.data(
														
 
															-                name='data_error', shape=[10, 4], dtype='int32', lod_level=1)
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.roi_pool,
														
 
															-                input=inputs,
														
 
															-                rois=rois,
														
 
															-                output_size=(7, 7))
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestIoUSimilarity(LayerTest):
														
 
															-    def test_iou_similarity(self):
														
 
															-        b, c, h, w = 2, 12, 20, 20
														
 
															-        inputs_np = np.random.rand(b, c, h, w).astype('float32')
														
 
															-        output_size = (7, 7)
														
 
															-        x_np = make_rois(h, w, [20], output_size)
														
 
															-        y_np = make_rois(h, w, [10], output_size)
														
 
															-        with self.static_graph():
														
 
															-            x = paddle.static.data(name='x', shape=[20, 4], dtype='float32')
														
 
															-            y = paddle.static.data(name='y', shape=[10, 4], dtype='float32')
														
 
															-
														
 
															-            iou = ops.iou_similarity(x=x, y=y)
														
 
															-            iou_np, = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'x': x_np,
														
 
															-                    'y': y_np,
														
 
															-                },
														
 
															-                fetch_list=[iou],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            x_dy = base.to_variable(x_np)
														
 
															-            y_dy = base.to_variable(y_np)
														
 
															-
														
 
															-            iou_dy = ops.iou_similarity(x=x_dy, y=y_dy)
														
 
															-            iou_dy_np = iou_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(iou_np, iou_dy_np))
														
 
															-
														
 
															-
														
 
															-class TestBipartiteMatch(LayerTest):
														
 
															-    def test_bipartite_match(self):
														
 
															-        distance = np.random.random((20, 10)).astype('float32')
														
 
															-        with self.static_graph():
														
 
															-            x = paddle.static.data(name='x', shape=[20, 10], dtype='float32')
														
 
															-
														
 
															-            match_indices, match_dist = ops.bipartite_match(
														
 
															-                x, match_type='per_prediction', dist_threshold=0.5)
														
 
															-            match_indices_np, match_dist_np = self.get_static_graph_result(
														
 
															-                feed={'x': distance, },
														
 
															-                fetch_list=[match_indices, match_dist],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            x_dy = base.to_variable(distance)
														
 
															-
														
 
															-            match_indices_dy, match_dist_dy = ops.bipartite_match(
														
 
															-                x_dy, match_type='per_prediction', dist_threshold=0.5)
														
 
															-            match_indices_dy_np = match_indices_dy.numpy()
														
 
															-            match_dist_dy_np = match_dist_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(match_indices_np, match_indices_dy_np))
														
 
															-        self.assertTrue(np.array_equal(match_dist_np, match_dist_dy_np))
														
 
															-
														
 
															-
														
 
															-class TestYoloBox(LayerTest):
														
 
															-    def test_yolo_box(self):
														
 
															-
														
 
															-        # x shape [N C H W], C=K * (5 + class_num), class_num=10, K=2
														
 
															-        np_x = np.random.random([1, 30, 7, 7]).astype('float32')
														
 
															-        np_origin_shape = np.array([[608, 608]], dtype='int32')
														
 
															-        class_num = 10
														
 
															-        conf_thresh = 0.01
														
 
															-        downsample_ratio = 32
														
 
															-        scale_x_y = 1.2
														
 
															-
														
 
															-        # static
														
 
															-        with self.static_graph():
														
 
															-            # x shape [N C H W], C=K * (5 + class_num), class_num=10, K=2
														
 
															-            x = paddle.static.data(
														
 
															-                name='x', shape=[1, 30, 7, 7], dtype='float32')
														
 
															-            origin_shape = paddle.static.data(
														
 
															-                name='origin_shape', shape=[1, 2], dtype='int32')
														
 
															-
														
 
															-            boxes, scores = ops.yolo_box(
														
 
															-                x,
														
 
															-                origin_shape, [10, 13, 30, 13],
														
 
															-                class_num,
														
 
															-                conf_thresh,
														
 
															-                downsample_ratio,
														
 
															-                scale_x_y=scale_x_y)
														
 
															-
														
 
															-            boxes_np, scores_np = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'x': np_x,
														
 
															-                    'origin_shape': np_origin_shape,
														
 
															-                },
														
 
															-                fetch_list=[boxes, scores],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        # dygraph
														
 
															-        with self.dynamic_graph():
														
 
															-            x_dy = fluid.layers.assign(np_x)
														
 
															-            origin_shape_dy = fluid.layers.assign(np_origin_shape)
														
 
															-
														
 
															-            boxes_dy, scores_dy = ops.yolo_box(
														
 
															-                x_dy,
														
 
															-                origin_shape_dy, [10, 13, 30, 13],
														
 
															-                10,
														
 
															-                0.01,
														
 
															-                32,
														
 
															-                scale_x_y=scale_x_y)
														
 
															-
														
 
															-            boxes_dy_np = boxes_dy.numpy()
														
 
															-            scores_dy_np = scores_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(boxes_np, boxes_dy_np))
														
 
															-        self.assertTrue(np.array_equal(scores_np, scores_dy_np))
														
 
															-
														
 
															-    def test_yolo_box_error(self):
														
 
															-        with self.static_graph():
														
 
															-            # x shape [N C H W], C=K * (5 + class_num), class_num=10, K=2
														
 
															-            x = paddle.static.data(
														
 
															-                name='x', shape=[1, 30, 7, 7], dtype='float32')
														
 
															-            origin_shape = paddle.static.data(
														
 
															-                name='origin_shape', shape=[1, 2], dtype='int32')
														
 
															-
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.yolo_box,
														
 
															-                x,
														
 
															-                origin_shape, [10, 13, 30, 13],
														
 
															-                10.123,
														
 
															-                0.01,
														
 
															-                32,
														
 
															-                scale_x_y=1.2)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestPriorBox(LayerTest):
														
 
															-    def test_prior_box(self):
														
 
															-        input_np = np.random.rand(2, 10, 32, 32).astype('float32')
														
 
															-        image_np = np.random.rand(2, 10, 40, 40).astype('float32')
														
 
															-        min_sizes = [2, 4]
														
 
															-        with self.static_graph():
														
 
															-            input = paddle.static.data(
														
 
															-                name='input', shape=[2, 10, 32, 32], dtype='float32')
														
 
															-            image = paddle.static.data(
														
 
															-                name='image', shape=[2, 10, 40, 40], dtype='float32')
														
 
															-
														
 
															-            box, var = ops.prior_box(
														
 
															-                input=input,
														
 
															-                image=image,
														
 
															-                min_sizes=min_sizes,
														
 
															-                clip=True,
														
 
															-                flip=True)
														
 
															-            box_np, var_np = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'input': input_np,
														
 
															-                    'image': image_np,
														
 
															-                },
														
 
															-                fetch_list=[box, var],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            inputs_dy = base.to_variable(input_np)
														
 
															-            image_dy = base.to_variable(image_np)
														
 
															-
														
 
															-            box_dy, var_dy = ops.prior_box(
														
 
															-                input=inputs_dy,
														
 
															-                image=image_dy,
														
 
															-                min_sizes=min_sizes,
														
 
															-                clip=True,
														
 
															-                flip=True)
														
 
															-            box_dy_np = box_dy.numpy()
														
 
															-            var_dy_np = var_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(box_np, box_dy_np))
														
 
															-        self.assertTrue(np.array_equal(var_np, var_dy_np))
														
 
															-
														
 
															-    def test_prior_box_error(self):
														
 
															-        with self.static_graph():
														
 
															-            input = paddle.static.data(
														
 
															-                name='input', shape=[2, 10, 32, 32], dtype='int32')
														
 
															-            image = paddle.static.data(
														
 
															-                name='image', shape=[2, 10, 40, 40], dtype='int32')
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.prior_box,
														
 
															-                input=input,
														
 
															-                image=image,
														
 
															-                min_sizes=[2, 4],
														
 
															-                clip=True,
														
 
															-                flip=True)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestMulticlassNms(LayerTest):
														
 
															-    def test_multiclass_nms(self):
														
 
															-        boxes_np = np.random.rand(10, 81, 4).astype('float32')
														
 
															-        scores_np = np.random.rand(10, 81).astype('float32')
														
 
															-        rois_num_np = np.array([2, 8]).astype('int32')
														
 
															-        with self.static_graph():
														
 
															-            boxes = paddle.static.data(
														
 
															-                name='bboxes',
														
 
															-                shape=[None, 81, 4],
														
 
															-                dtype='float32',
														
 
															-                lod_level=1)
														
 
															-            scores = paddle.static.data(
														
 
															-                name='scores', shape=[None, 81], dtype='float32', lod_level=1)
														
 
															-            rois_num = paddle.static.data(
														
 
															-                name='rois_num', shape=[None], dtype='int32')
														
 
															-
														
 
															-            output = ops.multiclass_nms(
														
 
															-                bboxes=boxes,
														
 
															-                scores=scores,
														
 
															-                background_label=0,
														
 
															-                score_threshold=0.5,
														
 
															-                nms_top_k=400,
														
 
															-                nms_threshold=0.3,
														
 
															-                keep_top_k=200,
														
 
															-                normalized=False,
														
 
															-                return_index=True,
														
 
															-                rois_num=rois_num)
														
 
															-            out_np, index_np, nms_rois_num_np = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'bboxes': boxes_np,
														
 
															-                    'scores': scores_np,
														
 
															-                    'rois_num': rois_num_np
														
 
															-                },
														
 
															-                fetch_list=output,
														
 
															-                with_lod=True)
														
 
															-            out_np = np.array(out_np)
														
 
															-            index_np = np.array(index_np)
														
 
															-            nms_rois_num_np = np.array(nms_rois_num_np)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            boxes_dy = base.to_variable(boxes_np)
														
 
															-            scores_dy = base.to_variable(scores_np)
														
 
															-            rois_num_dy = base.to_variable(rois_num_np)
														
 
															-
														
 
															-            out_dy, index_dy, nms_rois_num_dy = ops.multiclass_nms(
														
 
															-                bboxes=boxes_dy,
														
 
															-                scores=scores_dy,
														
 
															-                background_label=0,
														
 
															-                score_threshold=0.5,
														
 
															-                nms_top_k=400,
														
 
															-                nms_threshold=0.3,
														
 
															-                keep_top_k=200,
														
 
															-                normalized=False,
														
 
															-                return_index=True,
														
 
															-                rois_num=rois_num_dy)
														
 
															-            out_dy_np = out_dy.numpy()
														
 
															-            index_dy_np = index_dy.numpy()
														
 
															-            nms_rois_num_dy_np = nms_rois_num_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(out_np, out_dy_np))
														
 
															-        self.assertTrue(np.array_equal(index_np, index_dy_np))
														
 
															-        self.assertTrue(np.array_equal(nms_rois_num_np, nms_rois_num_dy_np))
														
 
															-
														
 
															-    def test_multiclass_nms_error(self):
														
 
															-        with self.static_graph():
														
 
															-            boxes = paddle.static.data(
														
 
															-                name='bboxes', shape=[81, 4], dtype='float32', lod_level=1)
														
 
															-            scores = paddle.static.data(
														
 
															-                name='scores', shape=[81], dtype='float32', lod_level=1)
														
 
															-            rois_num = paddle.static.data(
														
 
															-                name='rois_num', shape=[40, 41], dtype='int32')
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.multiclass_nms,
														
 
															-                boxes=boxes,
														
 
															-                scores=scores,
														
 
															-                background_label=0,
														
 
															-                score_threshold=0.5,
														
 
															-                nms_top_k=400,
														
 
															-                nms_threshold=0.3,
														
 
															-                keep_top_k=200,
														
 
															-                normalized=False,
														
 
															-                return_index=True,
														
 
															-                rois_num=rois_num)
														
 
															-
														
 
															-
														
 
															-class TestMatrixNMS(LayerTest):
														
 
															-    def test_matrix_nms(self):
														
 
															-        N, M, C = 7, 1200, 21
														
 
															-        BOX_SIZE = 4
														
 
															-        nms_top_k = 400
														
 
															-        keep_top_k = 200
														
 
															-        score_threshold = 0.01
														
 
															-        post_threshold = 0.
														
 
															-
														
 
															-        scores_np = np.random.random((N * M, C)).astype('float32')
														
 
															-        scores_np = np.apply_along_axis(softmax, 1, scores_np)
														
 
															-        scores_np = np.reshape(scores_np, (N, M, C))
														
 
															-        scores_np = np.transpose(scores_np, (0, 2, 1))
														
 
															-
														
 
															-        boxes_np = np.random.random((N, M, BOX_SIZE)).astype('float32')
														
 
															-        boxes_np[:, :, 0:2] = boxes_np[:, :, 0:2] * 0.5
														
 
															-        boxes_np[:, :, 2:4] = boxes_np[:, :, 2:4] * 0.5 + 0.5
														
 
															-
														
 
															-        with self.static_graph():
														
 
															-            boxes = paddle.static.data(
														
 
															-                name='boxes', shape=[N, M, BOX_SIZE], dtype='float32')
														
 
															-            scores = paddle.static.data(
														
 
															-                name='scores', shape=[N, C, M], dtype='float32')
														
 
															-            out, index, _ = ops.matrix_nms(
														
 
															-                bboxes=boxes,
														
 
															-                scores=scores,
														
 
															-                score_threshold=score_threshold,
														
 
															-                post_threshold=post_threshold,
														
 
															-                nms_top_k=nms_top_k,
														
 
															-                keep_top_k=keep_top_k,
														
 
															-                return_index=True)
														
 
															-            out_np, index_np = self.get_static_graph_result(
														
 
															-                feed={'boxes': boxes_np,
														
 
															-                      'scores': scores_np},
														
 
															-                fetch_list=[out, index],
														
 
															-                with_lod=True)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            boxes_dy = base.to_variable(boxes_np)
														
 
															-            scores_dy = base.to_variable(scores_np)
														
 
															-
														
 
															-            out_dy, index_dy, _ = ops.matrix_nms(
														
 
															-                bboxes=boxes_dy,
														
 
															-                scores=scores_dy,
														
 
															-                score_threshold=score_threshold,
														
 
															-                post_threshold=post_threshold,
														
 
															-                nms_top_k=nms_top_k,
														
 
															-                keep_top_k=keep_top_k,
														
 
															-                return_index=True)
														
 
															-            out_dy_np = out_dy.numpy()
														
 
															-            index_dy_np = index_dy.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(out_np, out_dy_np))
														
 
															-        self.assertTrue(np.array_equal(index_np, index_dy_np))
														
 
															-
														
 
															-    def test_matrix_nms_error(self):
														
 
															-        with self.static_graph():
														
 
															-            bboxes = paddle.static.data(
														
 
															-                name='bboxes', shape=[7, 1200, 4], dtype='float32')
														
 
															-            scores = paddle.static.data(
														
 
															-                name='data_error', shape=[7, 21, 1200], dtype='int32')
														
 
															-            self.assertRaises(
														
 
															-                TypeError,
														
 
															-                ops.matrix_nms,
														
 
															-                bboxes=bboxes,
														
 
															-                scores=scores,
														
 
															-                score_threshold=0.01,
														
 
															-                post_threshold=0.,
														
 
															-                nms_top_k=400,
														
 
															-                keep_top_k=200,
														
 
															-                return_index=True)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestBoxCoder(LayerTest):
														
 
															-    def test_box_coder(self):
														
 
															-
														
 
															-        prior_box_np = np.random.random((81, 4)).astype('float32')
														
 
															-        prior_box_var_np = np.random.random((81, 4)).astype('float32')
														
 
															-        target_box_np = np.random.random((20, 81, 4)).astype('float32')
														
 
															-
														
 
															-        # static
														
 
															-        with self.static_graph():
														
 
															-            prior_box = paddle.static.data(
														
 
															-                name='prior_box', shape=[81, 4], dtype='float32')
														
 
															-            prior_box_var = paddle.static.data(
														
 
															-                name='prior_box_var', shape=[81, 4], dtype='float32')
														
 
															-            target_box = paddle.static.data(
														
 
															-                name='target_box', shape=[20, 81, 4], dtype='float32')
														
 
															-
														
 
															-            boxes = ops.box_coder(
														
 
															-                prior_box=prior_box,
														
 
															-                prior_box_var=prior_box_var,
														
 
															-                target_box=target_box,
														
 
															-                code_type="decode_center_size",
														
 
															-                box_normalized=False)
														
 
															-
														
 
															-            boxes_np, = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'prior_box': prior_box_np,
														
 
															-                    'prior_box_var': prior_box_var_np,
														
 
															-                    'target_box': target_box_np,
														
 
															-                },
														
 
															-                fetch_list=[boxes],
														
 
															-                with_lod=False)
														
 
															-
														
 
															-        # dygraph
														
 
															-        with self.dynamic_graph():
														
 
															-            prior_box_dy = base.to_variable(prior_box_np)
														
 
															-            prior_box_var_dy = base.to_variable(prior_box_var_np)
														
 
															-            target_box_dy = base.to_variable(target_box_np)
														
 
															-
														
 
															-            boxes_dy = ops.box_coder(
														
 
															-                prior_box=prior_box_dy,
														
 
															-                prior_box_var=prior_box_var_dy,
														
 
															-                target_box=target_box_dy,
														
 
															-                code_type="decode_center_size",
														
 
															-                box_normalized=False)
														
 
															-
														
 
															-            boxes_dy_np = boxes_dy.numpy()
														
 
															-
														
 
															-            self.assertTrue(np.array_equal(boxes_np, boxes_dy_np))
														
 
															-
														
 
															-    def test_box_coder_error(self):
														
 
															-        with self.static_graph():
														
 
															-            prior_box = paddle.static.data(
														
 
															-                name='prior_box', shape=[81, 4], dtype='int32')
														
 
															-            prior_box_var = paddle.static.data(
														
 
															-                name='prior_box_var', shape=[81, 4], dtype='float32')
														
 
															-            target_box = paddle.static.data(
														
 
															-                name='target_box', shape=[20, 81, 4], dtype='float32')
														
 
															-
														
 
															-            self.assertRaises(TypeError, ops.box_coder, prior_box,
														
 
															-                              prior_box_var, target_box)
														
 
															-
														
 
															-        paddle.disable_static()
														
 
															-
														
 
															-
														
 
															-class TestGenerateProposals(LayerTest):
														
 
															-    def test_generate_proposals(self):
														
 
															-        scores_np = np.random.rand(2, 3, 4, 4).astype('float32')
														
 
															-        bbox_deltas_np = np.random.rand(2, 12, 4, 4).astype('float32')
														
 
															-        im_shape_np = np.array([[8, 8], [6, 6]]).astype('float32')
														
 
															-        anchors_np = np.reshape(np.arange(4 * 4 * 3 * 4),
														
 
															-                                [4, 4, 3, 4]).astype('float32')
														
 
															-        variances_np = np.ones((4, 4, 3, 4)).astype('float32')
														
 
															-
														
 
															-        with self.static_graph():
														
 
															-            scores = paddle.static.data(
														
 
															-                name='scores', shape=[2, 3, 4, 4], dtype='float32')
														
 
															-            bbox_deltas = paddle.static.data(
														
 
															-                name='bbox_deltas', shape=[2, 12, 4, 4], dtype='float32')
														
 
															-            im_shape = paddle.static.data(
														
 
															-                name='im_shape', shape=[2, 2], dtype='float32')
														
 
															-            anchors = paddle.static.data(
														
 
															-                name='anchors', shape=[4, 4, 3, 4], dtype='float32')
														
 
															-            variances = paddle.static.data(
														
 
															-                name='var', shape=[4, 4, 3, 4], dtype='float32')
														
 
															-            rois, roi_probs, rois_num = ops.generate_proposals(
														
 
															-                scores,
														
 
															-                bbox_deltas,
														
 
															-                im_shape,
														
 
															-                anchors,
														
 
															-                variances,
														
 
															-                pre_nms_top_n=10,
														
 
															-                post_nms_top_n=5,
														
 
															-                return_rois_num=True)
														
 
															-            rois_stat, roi_probs_stat, rois_num_stat = self.get_static_graph_result(
														
 
															-                feed={
														
 
															-                    'scores': scores_np,
														
 
															-                    'bbox_deltas': bbox_deltas_np,
														
 
															-                    'im_shape': im_shape_np,
														
 
															-                    'anchors': anchors_np,
														
 
															-                    'var': variances_np
														
 
															-                },
														
 
															-                fetch_list=[rois, roi_probs, rois_num],
														
 
															-                with_lod=True)
														
 
															-
														
 
															-        with self.dynamic_graph():
														
 
															-            scores_dy = base.to_variable(scores_np)
														
 
															-            bbox_deltas_dy = base.to_variable(bbox_deltas_np)
														
 
															-            im_shape_dy = base.to_variable(im_shape_np)
														
 
															-            anchors_dy = base.to_variable(anchors_np)
														
 
															-            variances_dy = base.to_variable(variances_np)
														
 
															-            rois, roi_probs, rois_num = ops.generate_proposals(
														
 
															-                scores_dy,
														
 
															-                bbox_deltas_dy,
														
 
															-                im_shape_dy,
														
 
															-                anchors_dy,
														
 
															-                variances_dy,
														
 
															-                pre_nms_top_n=10,
														
 
															-                post_nms_top_n=5,
														
 
															-                return_rois_num=True)
														
 
															-            rois_dy = rois.numpy()
														
 
															-            roi_probs_dy = roi_probs.numpy()
														
 
															-            rois_num_dy = rois_num.numpy()
														
 
															-
														
 
															-        self.assertTrue(np.array_equal(np.array(rois_stat), rois_dy))
														
 
															-        self.assertTrue(np.array_equal(np.array(roi_probs_stat), roi_probs_dy))
														
 
															-        self.assertTrue(np.array_equal(np.array(rois_num_stat), rois_num_dy))
														
 
															-
														
 
															-
														
 
															-if __name__ == '__main__':
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/modeling/tests/test_yolov3_loss.py
+++ b/paddlex/ppdet/modeling/tests/test_yolov3_loss.py
@@ -1,415 +0,0 @@
 
															-#   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
														
 
															-#
														
 
															-# Licensed under the Apache License, Version 2.0 (the "License");
														
 
															-# you may not use this file except in compliance with the License.
														
 
															-# You may obtain a copy of the License at
														
 
															-#
														
 
															-#     http://www.apache.org/licenses/LICENSE-2.0
														
 
															-#
														
 
															-# Unless required by applicable law or agreed to in writing, software
														
 
															-# distributed under the License is distributed on an "AS IS" BASIS,
														
 
															-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
														
 
															-# See the License for the specific language governing permissions and
														
 
															-# limitations under the License.
														
 
															-
														
 
															-from __future__ import division
														
 
															-
														
 
															-import unittest
														
 
															-
														
 
															-import paddle
														
 
															-from paddle import fluid
														
 
															-# add python path of PadleDetection to sys.path
														
 
															-import os
														
 
															-import sys
														
 
															-parent_path = os.path.abspath(os.path.join(__file__, *(['..'] * 4)))
														
 
															-if parent_path not in sys.path:
														
 
															-    sys.path.append(parent_path)
														
 
															-
														
 
															-from paddlex.ppdet.modeling.losses import YOLOv3Loss
														
 
															-from paddlex.ppdet.data.transform.op_helper import jaccard_overlap
														
 
															-import numpy as np
														
 
															-
														
 
															-
														
 
															-def _split_ioup(output, an_num, num_classes):
														
 
															-    """
														
 
															-    Split output feature map to output, predicted iou
														
 
															-    along channel dimension
														
 
															-    """
														
 
															-    ioup = fluid.layers.slice(output, axes=[1], starts=[0], ends=[an_num])
														
 
															-    ioup = fluid.layers.sigmoid(ioup)
														
 
															-    oriout = fluid.layers.slice(
														
 
															-        output, axes=[1], starts=[an_num], ends=[an_num * (num_classes + 6)])
														
 
															-    return (ioup, oriout)
														
 
															-
														
 
															-
														
 
															-def _split_output(output, an_num, num_classes):
														
 
															-    """
														
 
															-    Split output feature map to x, y, w, h, objectness, classification
														
 
															-    along channel dimension
														
 
															-    """
														
 
															-    x = fluid.layers.strided_slice(
														
 
															-        output,
														
 
															-        axes=[1],
														
 
															-        starts=[0],
														
 
															-        ends=[output.shape[1]],
														
 
															-        strides=[5 + num_classes])
														
 
															-    y = fluid.layers.strided_slice(
														
 
															-        output,
														
 
															-        axes=[1],
														
 
															-        starts=[1],
														
 
															-        ends=[output.shape[1]],
														
 
															-        strides=[5 + num_classes])
														
 
															-    w = fluid.layers.strided_slice(
														
 
															-        output,
														
 
															-        axes=[1],
														
 
															-        starts=[2],
														
 
															-        ends=[output.shape[1]],
														
 
															-        strides=[5 + num_classes])
														
 
															-    h = fluid.layers.strided_slice(
														
 
															-        output,
														
 
															-        axes=[1],
														
 
															-        starts=[3],
														
 
															-        ends=[output.shape[1]],
														
 
															-        strides=[5 + num_classes])
														
 
															-    obj = fluid.layers.strided_slice(
														
 
															-        output,
														
 
															-        axes=[1],
														
 
															-        starts=[4],
														
 
															-        ends=[output.shape[1]],
														
 
															-        strides=[5 + num_classes])
														
 
															-    clss = []
														
 
															-    stride = output.shape[1] // an_num
														
 
															-    for m in range(an_num):
														
 
															-        clss.append(
														
 
															-            fluid.layers.slice(
														
 
															-                output,
														
 
															-                axes=[1],
														
 
															-                starts=[stride * m + 5],
														
 
															-                ends=[stride * m + 5 + num_classes]))
														
 
															-    cls = fluid.layers.transpose(
														
 
															-        fluid.layers.stack(
														
 
															-            clss, axis=1), perm=[0, 1, 3, 4, 2])
														
 
															-    return (x, y, w, h, obj, cls)
														
 
															-
														
 
															-
														
 
															-def _split_target(target):
														
 
															-    """
														
 
															-    split target to x, y, w, h, objectness, classification
														
 
															-    along dimension 2
														
 
															-    target is in shape [N, an_num, 6 + class_num, H, W]
														
 
															-    """
														
 
															-    tx = target[:, :, 0, :, :]
														
 
															-    ty = target[:, :, 1, :, :]
														
 
															-    tw = target[:, :, 2, :, :]
														
 
															-    th = target[:, :, 3, :, :]
														
 
															-    tscale = target[:, :, 4, :, :]
														
 
															-    tobj = target[:, :, 5, :, :]
														
 
															-    tcls = fluid.layers.transpose(target[:, :, 6:, :, :], perm=[0, 1, 3, 4, 2])
														
 
															-    tcls.stop_gradient = True
														
 
															-    return (tx, ty, tw, th, tscale, tobj, tcls)
														
 
															-
														
 
															-
														
 
															-def _calc_obj_loss(output, obj, tobj, gt_box, batch_size, anchors, num_classes,
														
 
															-                   downsample, ignore_thresh, scale_x_y):
														
 
															-    # A prediction bbox overlap any gt_bbox over ignore_thresh,
														
 
															-    # objectness loss will be ignored, process as follows:
														
 
															-    # 1. get pred bbox, which is same with YOLOv3 infer mode, use yolo_box here
														
 
															-    # NOTE: img_size is set as 1.0 to get noramlized pred bbox
														
 
															-    bbox, prob = fluid.layers.yolo_box(
														
 
															-        x=output,
														
 
															-        img_size=fluid.layers.ones(
														
 
															-            shape=[batch_size, 2], dtype="int32"),
														
 
															-        anchors=anchors,
														
 
															-        class_num=num_classes,
														
 
															-        conf_thresh=0.,
														
 
															-        downsample_ratio=downsample,
														
 
															-        clip_bbox=False,
														
 
															-        scale_x_y=scale_x_y)
														
 
															-    # 2. split pred bbox and gt bbox by sample, calculate IoU between pred bbox
														
 
															-    #    and gt bbox in each sample
														
 
															-    if batch_size > 1:
														
 
															-        preds = fluid.layers.split(bbox, batch_size, dim=0)
														
 
															-        gts = fluid.layers.split(gt_box, batch_size, dim=0)
														
 
															-    else:
														
 
															-        preds = [bbox]
														
 
															-        gts = [gt_box]
														
 
															-        probs = [prob]
														
 
															-    ious = []
														
 
															-    for pred, gt in zip(preds, gts):
														
 
															-
														
 
															-        def box_xywh2xyxy(box):
														
 
															-            x = box[:, 0]
														
 
															-            y = box[:, 1]
														
 
															-            w = box[:, 2]
														
 
															-            h = box[:, 3]
														
 
															-            return fluid.layers.stack(
														
 
															-                [
														
 
															-                    x - w / 2.,
														
 
															-                    y - h / 2.,
														
 
															-                    x + w / 2.,
														
 
															-                    y + h / 2.,
														
 
															-                ], axis=1)
														
 
															-
														
 
															-        pred = fluid.layers.squeeze(pred, axes=[0])
														
 
															-        gt = box_xywh2xyxy(fluid.layers.squeeze(gt, axes=[0]))
														
 
															-        ious.append(fluid.layers.iou_similarity(pred, gt))
														
 
															-    iou = fluid.layers.stack(ious, axis=0)
														
 
															-    # 3. Get iou_mask by IoU between gt bbox and prediction bbox,
														
 
															-    #    Get obj_mask by tobj(holds gt_score), calculate objectness loss
														
 
															-    max_iou = fluid.layers.reduce_max(iou, dim=-1)
														
 
															-    iou_mask = fluid.layers.cast(max_iou <= ignore_thresh, dtype="float32")
														
 
															-    output_shape = fluid.layers.shape(output)
														
 
															-    an_num = len(anchors) // 2
														
 
															-    iou_mask = fluid.layers.reshape(iou_mask, (-1, an_num, output_shape[2],
														
 
															-                                               output_shape[3]))
														
 
															-    iou_mask.stop_gradient = True
														
 
															-    # NOTE: tobj holds gt_score, obj_mask holds object existence mask
														
 
															-    obj_mask = fluid.layers.cast(tobj > 0., dtype="float32")
														
 
															-    obj_mask.stop_gradient = True
														
 
															-    # For positive objectness grids, objectness loss should be calculated
														
 
															-    # For negative objectness grids, objectness loss is calculated only iou_mask == 1.0
														
 
															-    loss_obj = fluid.layers.sigmoid_cross_entropy_with_logits(obj, obj_mask)
														
 
															-    loss_obj_pos = fluid.layers.reduce_sum(loss_obj * tobj, dim=[1, 2, 3])
														
 
															-    loss_obj_neg = fluid.layers.reduce_sum(
														
 
															-        loss_obj * (1.0 - obj_mask) * iou_mask, dim=[1, 2, 3])
														
 
															-    return loss_obj_pos, loss_obj_neg
														
 
															-
														
 
															-
														
 
															-def fine_grained_loss(output,
														
 
															-                      target,
														
 
															-                      gt_box,
														
 
															-                      batch_size,
														
 
															-                      num_classes,
														
 
															-                      anchors,
														
 
															-                      ignore_thresh,
														
 
															-                      downsample,
														
 
															-                      scale_x_y=1.,
														
 
															-                      eps=1e-10):
														
 
															-    an_num = len(anchors) // 2
														
 
															-    x, y, w, h, obj, cls = _split_output(output, an_num, num_classes)
														
 
															-    tx, ty, tw, th, tscale, tobj, tcls = _split_target(target)
														
 
															-
														
 
															-    tscale_tobj = tscale * tobj
														
 
															-
														
 
															-    scale_x_y = scale_x_y
														
 
															-
														
 
															-    if (abs(scale_x_y - 1.0) < eps):
														
 
															-        loss_x = fluid.layers.sigmoid_cross_entropy_with_logits(
														
 
															-            x, tx) * tscale_tobj
														
 
															-        loss_x = fluid.layers.reduce_sum(loss_x, dim=[1, 2, 3])
														
 
															-        loss_y = fluid.layers.sigmoid_cross_entropy_with_logits(
														
 
															-            y, ty) * tscale_tobj
														
 
															-        loss_y = fluid.layers.reduce_sum(loss_y, dim=[1, 2, 3])
														
 
															-    else:
														
 
															-        dx = scale_x_y * fluid.layers.sigmoid(x) - 0.5 * (scale_x_y - 1.0)
														
 
															-        dy = scale_x_y * fluid.layers.sigmoid(y) - 0.5 * (scale_x_y - 1.0)
														
 
															-        loss_x = fluid.layers.abs(dx - tx) * tscale_tobj
														
 
															-        loss_x = fluid.layers.reduce_sum(loss_x, dim=[1, 2, 3])
														
 
															-        loss_y = fluid.layers.abs(dy - ty) * tscale_tobj
														
 
															-        loss_y = fluid.layers.reduce_sum(loss_y, dim=[1, 2, 3])
														
 
															-
														
 
															-    # NOTE: we refined loss function of (w, h) as L1Loss
														
 
															-    loss_w = fluid.layers.abs(w - tw) * tscale_tobj
														
 
															-    loss_w = fluid.layers.reduce_sum(loss_w, dim=[1, 2, 3])
														
 
															-    loss_h = fluid.layers.abs(h - th) * tscale_tobj
														
 
															-    loss_h = fluid.layers.reduce_sum(loss_h, dim=[1, 2, 3])
														
 
															-
														
 
															-    loss_obj_pos, loss_obj_neg = _calc_obj_loss(
														
 
															-        output, obj, tobj, gt_box, batch_size, anchors, num_classes,
														
 
															-        downsample, ignore_thresh, scale_x_y)
														
 
															-
														
 
															-    loss_cls = fluid.layers.sigmoid_cross_entropy_with_logits(cls, tcls)
														
 
															-    loss_cls = fluid.layers.elementwise_mul(loss_cls, tobj, axis=0)
														
 
															-    loss_cls = fluid.layers.reduce_sum(loss_cls, dim=[1, 2, 3, 4])
														
 
															-
														
 
															-    loss_xys = fluid.layers.reduce_mean(loss_x + loss_y)
														
 
															-    loss_whs = fluid.layers.reduce_mean(loss_w + loss_h)
														
 
															-    loss_objs = fluid.layers.reduce_mean(loss_obj_pos + loss_obj_neg)
														
 
															-    loss_clss = fluid.layers.reduce_mean(loss_cls)
														
 
															-
														
 
															-    losses_all = {
														
 
															-        "loss_xy": fluid.layers.sum(loss_xys),
														
 
															-        "loss_wh": fluid.layers.sum(loss_whs),
														
 
															-        "loss_loc": fluid.layers.sum(loss_xys) + fluid.layers.sum(loss_whs),
														
 
															-        "loss_obj": fluid.layers.sum(loss_objs),
														
 
															-        "loss_cls": fluid.layers.sum(loss_clss),
														
 
															-    }
														
 
															-    return losses_all, x, y, tx, ty
														
 
															-
														
 
															-
														
 
															-def gt2yolotarget(gt_bbox, gt_class, gt_score, anchors, mask, num_classes,
														
 
															-                  size, stride):
														
 
															-    grid_h, grid_w = size
														
 
															-    h, w = grid_h * stride, grid_w * stride
														
 
															-    an_hw = np.array(anchors) / np.array([[w, h]])
														
 
															-    target = np.zeros(
														
 
															-        (len(mask), 6 + num_classes, grid_h, grid_w), dtype=np.float32)
														
 
															-    for b in range(gt_bbox.shape[0]):
														
 
															-        gx, gy, gw, gh = gt_bbox[b, :]
														
 
															-        cls = gt_class[b]
														
 
															-        score = gt_score[b]
														
 
															-        if gw <= 0. or gh <= 0. or score <= 0.:
														
 
															-            continue
														
 
															-
														
 
															-        # find best match anchor index
														
 
															-        best_iou = 0.
														
 
															-        best_idx = -1
														
 
															-        for an_idx in range(an_hw.shape[0]):
														
 
															-            iou = jaccard_overlap(
														
 
															-                [0., 0., gw, gh],
														
 
															-                [0., 0., an_hw[an_idx, 0], an_hw[an_idx, 1]])
														
 
															-            if iou > best_iou:
														
 
															-                best_iou = iou
														
 
															-                best_idx = an_idx
														
 
															-
														
 
															-        gi = int(gx * grid_w)
														
 
															-        gj = int(gy * grid_h)
														
 
															-
														
 
															-        # gtbox should be regresed in this layes if best match
														
 
															-        # anchor index in anchor mask of this layer
														
 
															-        if best_idx in mask:
														
 
															-            best_n = mask.index(best_idx)
														
 
															-
														
 
															-            # x, y, w, h, scale
														
 
															-            target[best_n, 0, gj, gi] = gx * grid_w - gi
														
 
															-            target[best_n, 1, gj, gi] = gy * grid_h - gj
														
 
															-            target[best_n, 2, gj, gi] = np.log(gw * w / anchors[best_idx][0])
														
 
															-            target[best_n, 3, gj, gi] = np.log(gh * h / anchors[best_idx][1])
														
 
															-            target[best_n, 4, gj, gi] = 2.0 - gw * gh
														
 
															-
														
 
															-            # objectness record gt_score
														
 
															-            # if target[best_n, 5, gj, gi] > 0:
														
 
															-            #     print('find 1 duplicate')
														
 
															-            target[best_n, 5, gj, gi] = score
														
 
															-
														
 
															-            # classification
														
 
															-            target[best_n, 6 + cls, gj, gi] = 1.
														
 
															-
														
 
															-    return target
														
 
															-
														
 
															-
														
 
															-class TestYolov3LossOp(unittest.TestCase):
														
 
															-    def setUp(self):
														
 
															-        self.initTestCase()
														
 
															-        x = np.random.uniform(0, 1, self.x_shape).astype('float64')
														
 
															-        gtbox = np.random.random(size=self.gtbox_shape).astype('float64')
														
 
															-        gtlabel = np.random.randint(0, self.class_num, self.gtbox_shape[:2])
														
 
															-        gtmask = np.random.randint(0, 2, self.gtbox_shape[:2])
														
 
															-        gtbox = gtbox * gtmask[:, :, np.newaxis]
														
 
															-        gtlabel = gtlabel * gtmask
														
 
															-
														
 
															-        gtscore = np.ones(self.gtbox_shape[:2]).astype('float64')
														
 
															-        if self.gtscore:
														
 
															-            gtscore = np.random.random(self.gtbox_shape[:2]).astype('float64')
														
 
															-
														
 
															-        target = []
														
 
															-        for box, label, score in zip(gtbox, gtlabel, gtscore):
														
 
															-            target.append(
														
 
															-                gt2yolotarget(box, label, score, self.anchors,
														
 
															-                              self.anchor_mask, self.class_num, (
														
 
															-                                  self.h, self.w), self.downsample_ratio))
														
 
															-
														
 
															-        self.target = np.array(target).astype('float64')
														
 
															-
														
 
															-        self.mask_anchors = []
														
 
															-        for i in self.anchor_mask:
														
 
															-            self.mask_anchors.extend(self.anchors[i])
														
 
															-        self.x = x
														
 
															-        self.gtbox = gtbox
														
 
															-        self.gtlabel = gtlabel
														
 
															-        self.gtscore = gtscore
														
 
															-
														
 
															-    def initTestCase(self):
														
 
															-        self.b = 8
														
 
															-        self.h = 19
														
 
															-        self.w = 19
														
 
															-        self.anchors = [[10, 13], [16, 30], [33, 23], [30, 61], [62, 45],
														
 
															-                        [59, 119], [116, 90], [156, 198], [373, 326]]
														
 
															-        self.anchor_mask = [6, 7, 8]
														
 
															-        self.na = len(self.anchor_mask)
														
 
															-        self.class_num = 80
														
 
															-        self.ignore_thresh = 0.7
														
 
															-        self.downsample_ratio = 32
														
 
															-        self.x_shape = (self.b, len(self.anchor_mask) * (5 + self.class_num),
														
 
															-                        self.h, self.w)
														
 
															-        self.gtbox_shape = (self.b, 40, 4)
														
 
															-        self.gtscore = True
														
 
															-        self.use_label_smooth = False
														
 
															-        self.scale_x_y = 1.
														
 
															-
														
 
															-    def test_loss(self):
														
 
															-        x, gtbox, gtlabel, gtscore, target = self.x, self.gtbox, self.gtlabel, self.gtscore, self.target
														
 
															-        yolo_loss = YOLOv3Loss(
														
 
															-            ignore_thresh=self.ignore_thresh,
														
 
															-            label_smooth=self.use_label_smooth,
														
 
															-            num_classes=self.class_num,
														
 
															-            downsample=self.downsample_ratio,
														
 
															-            scale_x_y=self.scale_x_y)
														
 
															-        x = paddle.to_tensor(x.astype(np.float32))
														
 
															-        gtbox = paddle.to_tensor(gtbox.astype(np.float32))
														
 
															-        gtlabel = paddle.to_tensor(gtlabel.astype(np.float32))
														
 
															-        gtscore = paddle.to_tensor(gtscore.astype(np.float32))
														
 
															-        t = paddle.to_tensor(target.astype(np.float32))
														
 
															-        anchor = [self.anchors[i] for i in self.anchor_mask]
														
 
															-        (yolo_loss1, px, py, tx, ty) = fine_grained_loss(
														
 
															-            output=x,
														
 
															-            target=t,
														
 
															-            gt_box=gtbox,
														
 
															-            batch_size=self.b,
														
 
															-            num_classes=self.class_num,
														
 
															-            anchors=self.mask_anchors,
														
 
															-            ignore_thresh=self.ignore_thresh,
														
 
															-            downsample=self.downsample_ratio,
														
 
															-            scale_x_y=self.scale_x_y)
														
 
															-        yolo_loss2 = yolo_loss.yolov3_loss(
														
 
															-            x, t, gtbox, anchor, self.downsample_ratio, self.scale_x_y)
														
 
															-        for k in yolo_loss2:
														
 
															-            self.assertAlmostEqual(
														
 
															-                yolo_loss1[k].numpy()[0],
														
 
															-                yolo_loss2[k].numpy()[0],
														
 
															-                delta=1e-2,
														
 
															-                msg=k)
														
 
															-
														
 
															-
														
 
															-class TestYolov3LossNoGTScore(TestYolov3LossOp):
														
 
															-    def initTestCase(self):
														
 
															-        self.b = 1
														
 
															-        self.h = 76
														
 
															-        self.w = 76
														
 
															-        self.anchors = [[10, 13], [16, 30], [33, 23], [30, 61], [62, 45],
														
 
															-                        [59, 119], [116, 90], [156, 198], [373, 326]]
														
 
															-        self.anchor_mask = [0, 1, 2]
														
 
															-        self.na = len(self.anchor_mask)
														
 
															-        self.class_num = 80
														
 
															-        self.ignore_thresh = 0.7
														
 
															-        self.downsample_ratio = 8
														
 
															-        self.x_shape = (self.b, len(self.anchor_mask) * (5 + self.class_num),
														
 
															-                        self.h, self.w)
														
 
															-        self.gtbox_shape = (self.b, 40, 4)
														
 
															-        self.gtscore = False
														
 
															-        self.use_label_smooth = False
														
 
															-        self.scale_x_y = 1.
														
 
															-
														
 
															-
														
 
															-class TestYolov3LossWithScaleXY(TestYolov3LossOp):
														
 
															-    def initTestCase(self):
														
 
															-        self.b = 5
														
 
															-        self.h = 38
														
 
															-        self.w = 38
														
 
															-        self.anchors = [[10, 13], [16, 30], [33, 23], [30, 61], [62, 45],
														
 
															-                        [59, 119], [116, 90], [156, 198], [373, 326]]
														
 
															-        self.anchor_mask = [3, 4, 5]
														
 
															-        self.na = len(self.anchor_mask)
														
 
															-        self.class_num = 80
														
 
															-        self.ignore_thresh = 0.7
														
 
															-        self.downsample_ratio = 16
														
 
															-        self.x_shape = (self.b, len(self.anchor_mask) * (5 + self.class_num),
														
 
															-                        self.h, self.w)
														
 
															-        self.gtbox_shape = (self.b, 40, 4)
														
 
															-        self.gtscore = True
														
 
															-        self.use_label_smooth = False
														
 
															-        self.scale_x_y = 1.2
														
 
															-
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    unittest.main()
														
--- a/paddlex/ppdet/optimizer.py
+++ b/paddlex/ppdet/optimizer.py
@@ -42,9 +42,10 @@ class CosineDecay(object):
 
															             the max_iters is much larger than the warmup iter
														
 
															     """
														
 
															-    def __init__(self, max_epochs=1000, use_warmup=True):
														
 
															+    def __init__(self, max_epochs=1000, use_warmup=True, eta_min=0):
														
 
															         self.max_epochs = max_epochs
														
 
															         self.use_warmup = use_warmup
														
 
															+        self.eta_min = eta_min
														
 
															     def __call__(self,
														
 
															                  base_lr=None,
														
@@ -66,7 +67,8 @@ class CosineDecay(object):
 
															                 value.append(decayed_lr)
														
 
															             return optimizer.lr.PiecewiseDecay(boundary, value)
														
 
															-        return optimizer.lr.CosineAnnealingDecay(base_lr, T_max=max_iters)
														
 
															+        return optimizer.lr.CosineAnnealingDecay(
														
 
															+            base_lr, T_max=max_iters, eta_min=self.eta_min)
														
 
															 @serializable
														
--- a/paddlex/ppdet/utils/checkpoint.py
+++ b/paddlex/ppdet/utils/checkpoint.py
@@ -124,7 +124,7 @@ def match_state_dict(model_state_dict, weight_state_dict):
 
															     weight_keys = sorted(weight_state_dict.keys())
														
 
															     def match(a, b):
														
 
															-        if a.startswith('backbone.res5'):
														
 
															+        if b.startswith('backbone.res5'):
														
 
															             # In Faster RCNN, res5 pretrained weights have prefix of backbone,
														
 
															             # however, the corresponding model weights have difficult prefix,
														
 
															             # bbox_head.
														
@@ -139,10 +139,14 @@ def match_state_dict(model_state_dict, weight_state_dict):
 
															     max_id = match_matrix.argmax(1)
														
 
															     max_len = match_matrix.max(1)
														
 
															     max_id[max_len == 0] = -1
														
 
															+
														
 
															+    load_id = set(max_id)
														
 
															+    load_id.discard(-1)
														
 
															     not_load_weight_name = []
														
 
															-    for match_idx in range(len(max_id)):
														
 
															-        if match_idx < len(weight_keys) and max_id[match_idx] == -1:
														
 
															-            not_load_weight_name.append(weight_keys[match_idx])
														
 
															+    for idx in range(len(weight_keys)):
														
 
															+        if idx not in load_id:
														
 
															+            not_load_weight_name.append(weight_keys[idx])
														
 
															+
														
 
															     if len(not_load_weight_name) > 0:
														
 
															         logger.info('{} in pretrained weight is not used in the model, '
														
 
															                     'and its will not be loaded'.format(not_load_weight_name))
														
--- a/paddlex/utils/checkpoint.py
+++ b/paddlex/utils/checkpoint.py
@@ -85,6 +85,28 @@ cityscapes_weights = {
 
															 }
														
 
															 imagenet_weights = {
														
 
															+    'PPLCNet_x0_25_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x0_25_pretrained.pdparams',
														
 
															+    'PPLCNet_x0_35_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x0_35_pretrained.pdparams',
														
 
															+    'PPLCNet_x0_5_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x0_5_pretrained.pdparams',
														
 
															+    'PPLCNet_x0_75_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x0_75_pretrained.pdparams',
														
 
															+    'PPLCNet_x1_0_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x1_0_pretrained.pdparams',
														
 
															+    'PPLCNet_x1_5_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x1_5_pretrained.pdparams',
														
 
															+    'PPLCNet_x2_0_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x2_0_pretrained.pdparams',
														
 
															+    'PPLCNet_x2_5_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x2_5_pretrained.pdparams',
														
 
															+    'PPLCNet_x0_5_ssld_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x0_5_ssld_pretrained.pdparams',
														
 
															+    'PPLCNet_x1_0_ssld_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x1_0_ssld_pretrained.pdparams',
														
 
															+    'PPLCNet_x2_5_ssld_IMAGENET':
														
 
															+    'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/PPLCNet_x2_5_ssld_pretrained.pdparams',
														
 
															     'ResNet18_IMAGENET':
														
 
															     'https://paddle-imagenet-models-name.bj.bcebos.com/dygraph/legendary_models/ResNet18_pretrained.pdparams',
														
 
															     'ResNet34_IMAGENET':
														
--- a/paddlex_restful/restful/app.py
+++ b/paddlex_restful/restful/app.py
@@ -569,9 +569,6 @@ def task_evaluate():
 
															         ret = get_evaluate_result(data, SD.workspace)
														
 
															         if ret['evaluate_status'] == TaskStatus.XEVALUATED and ret[
														
 
															                 'result'] is not None:
														
 
															-            if 'Confusion_Matrix' in ret['result']:
														
 
															-                ret['result']['Confusion_Matrix'] = ret['result'][
														
 
															-                    'Confusion_Matrix']
														
 
															             ret['result'] = CustomEncoder().encode(ret['result'])
														
 
															             ret['result'] = json.loads(ret['result'])
														
 
															         ret['evaluate_status'] = ret['evaluate_status'].value
														
@@ -893,16 +890,11 @@ def model():
 
															                 return ret
														
 
															         from .model import get_model_details
														
 
															         ret = get_model_details(data, SD.workspace)
														
 
															-        ret['eval_result']['Confusion_Matrix'] = ret['eval_result'][
														
 
															-            'Confusion_Matrix'].tolist()
														
 
															         ret['eval_result'] = CustomEncoder().encode(ret['eval_result'])
														
 
															         ret['task_params'] = CustomEncoder().encode(ret['task_params'])
														
 
															         return ret
														
 
															     if request.method == 'POST':
														
 
															         if data['type'] == 'pretrained':
														
 
															-            if 'eval_results' in data:
														
 
															-                data['eval_results']['Confusion_Matrix'] = np.array(data[
														
 
															-                    'eval_results']['Confusion_Matrix'])
														
 
															             from .model import create_pretrained_model
														
 
															             ret = create_pretrained_model(data, SD.workspace,
														
 
															                                           SD.monitored_processes)
														
--- a/paddlex_restful/restful/project/train/classification.py
+++ b/paddlex_restful/restful/project/train/classification.py
@@ -70,7 +70,7 @@ def build_optimizer(parameters, step_each_epoch, params):
 
															     num_epochs = params.num_epochs
														
 
															     if params.lr_policy == 'Cosine':
														
 
															         learning_rate = paddle.optimizer.lr.CosineAnnealingDecay(
														
 
															-            learning_rate=.001, T_max=step_each_epoch * num_epochs)
														
 
															+            learning_rate=learning_rate, T_max=step_each_epoch * num_epochs)
														
 
															     elif params.lr_policy == 'Linear':
														
 
															         learning_rate = paddle.optimizer.lr.PolynomialDecay(
														
 
															             learning_rate=learning_rate,
														
--- a/paddlex_restful/restful/project/train/detection.py
+++ b/paddlex_restful/restful/project/train/detection.py
@@ -90,6 +90,40 @@ def build_rcnn_transforms(params):
 
															     return train_transforms, eval_transforms
														
 
															+def build_pico_transforms(params):
														
 
															+    from paddlex import transforms as T
														
 
															+    target_size = params.image_shape[0]
														
 
															+    dt_list = []
														
 
															+    dt_list.extend([
														
 
															+        T.RandomDistort(
														
 
															+            brightness_range=params.brightness_range,
														
 
															+            brightness_prob=params.brightness_prob,
														
 
															+            contrast_range=params.contrast_range,
														
 
															+            contrast_prob=params.contrast_prob,
														
 
															+            saturation_range=params.saturation_range,
														
 
															+            saturation_prob=params.saturation_prob,
														
 
															+            hue_range=params.hue_range,
														
 
															+            hue_prob=params.hue_prob),
														
 
															+    ])
														
 
															+    crop_image = params.crop_image
														
 
															+    if crop_image:
														
 
															+        dt_list.append(T.RandomCrop())
														
 
															+    dt_list.extend([
														
 
															+        T.Resize(
														
 
															+            target_size=target_size, interp='RANDOM'),
														
 
															+        T.RandomHorizontalFlip(prob=params.horizontal_flip_prob), T.Normalize(
														
 
															+            mean=params.image_mean, std=params.image_std)
														
 
															+    ])
														
 
															+    train_transforms = T.Compose(dt_list)
														
 
															+    eval_transforms = T.Compose([
														
 
															+        T.Resize(
														
 
															+            target_size=target_size, interp='CUBIC'),
														
 
															+        T.Normalize(
														
 
															+            mean=params.image_mean, std=params.image_std),
														
 
															+    ])
														
 
															+    return train_transforms, eval_transforms
														
 
															+
														
 
															+
														
 
															 def build_voc_datasets(dataset_path, train_transforms, eval_transforms):
														
 
															     import paddlex as pdx
														
 
															     train_file_list = osp.join(dataset_path, 'train_list.txt')
														
@@ -157,6 +191,8 @@ def train(task_path, dataset_path, params):
 
															     pdx.log_level = 3
														
 
															     if params.model in ['YOLOv3', 'PPYOLO', 'PPYOLOTiny', 'PPYOLOv2']:
														
 
															         train_transforms, eval_transforms = build_yolo_transforms(params)
														
 
															+    elif params.model in ['PicoDet']:
														
 
															+        train_transforms, eval_transforms = build_pico_transforms(params)
														
 
															     elif params.model in ['FasterRCNN', 'MaskRCNN']:
														
 
															         train_transforms, eval_transforms = build_rcnn_transforms(params)
														
 
															     if osp.exists(osp.join(dataset_path, 'JPEGImages')) and \
														
@@ -194,7 +230,8 @@ def train(task_path, dataset_path, params):
 
															         # prune
														
 
															         dataset = eval_dataset or train_dataset
														
 
															         im_shape = dataset[0]['image'].shape[:2]
														
 
															-        if getattr(model, 'with_fpn', False):
														
 
															+        if getattr(model, 'with_fpn',
														
 
															+                   False) or model.__class__.__name__ == 'PicoDet':
														
 
															             im_shape[0] = int(np.ceil(im_shape[0] / 32) * 32)
														
 
															             im_shape[1] = int(np.ceil(im_shape[1] / 32) * 32)
														
 
															         inputs = [{
														
--- a/requirements.txt
+++ b/requirements.txt
@@ -4,9 +4,9 @@ colorama
 
															 cython
														
 
															 pycocotools
														
 
															 visualdl >= 2.1.1
														
 
															-paddleslim == 2.1.1
														
 
															+paddleslim == 2.2.1
														
 
															 shapely
														
 
															-paddlepaddle-gpu == 2.2.0
														
 
															+paddlepaddle-gpu >= 2.2.0
														
 
															 opencv-python
														
 
															 scikit-learn==0.23.2
														
 
															 lap
														
--- a/setup.py
+++ b/setup.py
@@ -13,13 +13,12 @@
 
															 # limitations under the License.
														
 
															 import setuptools
														
 
															-import sys
														
 
															-long_description = "PaddlePaddle Entire Process Development Toolkit"
														
 
															+long_description = "PaddlePaddle End-to-End Development Toolkit"
														
 
															 setuptools.setup(
														
 
															     name="paddlex",
														
 
															-    version='2.0.0',
														
 
															+    version='2.1.0',
														
 
															     author="paddlex",
														
 
															     author_email="paddlex@baidu.com",
														
 
															     description=long_description,
														
@@ -38,9 +37,10 @@ setuptools.setup(
 
															     include_data_files=True,
														
 
															     setup_requires=['cython', 'numpy'],
														
 
															     install_requires=[
														
 
															-        "pycocotools", 'pyyaml', 'colorama', 'tqdm', 'paddleslim==2.1.1',
														
 
															-        'visualdl>=2.1.1', 'shapely>=1.7.0', 'opencv-python', 'scipy', 'lap',
														
 
															-        'motmetrics', 'scikit-learn==0.23.2', 'chardet', 'flask_cors'
														
 
															+        "pycocotools", 'pyyaml', 'colorama', 'tqdm', 'paddleslim==2.2.1',
														
 
															+        'visualdl>=2.2.2', 'shapely>=1.7.0', 'opencv-python', 'scipy', 'lap',
														
 
															+        'motmetrics', 'scikit-learn==0.23.2', 'chardet', 'flask_cors',
														
 
															+        'openpyxl'
														
 
															     ],
														
 
															     classifiers=[
														
 
															         "Programming Language :: Python :: 3",
														
--- a/static/docs/apis/visualize.md
+++ b/static/docs/apis/visualize.md
@@ -151,7 +151,7 @@ paddlex.det.coco_error_analysis(eval_details_file=None, gt=None, pred_bbox=None,
 
															 ![](images/detection_analysis.jpg)
														
 
															-左图显示的是`person`类的分析结果，有图显示的是所有类别整体的分析结果。
														
 
															+左图显示的是`person`类的分析结果，右图显示的是所有类别整体的分析结果。
														
 
															 分析图表展示了7条Precision-Recall（PR）曲线，每一条曲线表示的Average Precision （AP）比它左边那条高，原因是逐步放宽了评估要求。以`person`类为例，各条PR曲线的评估要求解释如下：
														
--- a/tutorials/train/image_classification/pplcnet.py
+++ b/tutorials/train/image_classification/pplcnet.py
@@ -0,0 +1,50 @@
 
															+import paddlex as pdx
														
 
															+from paddlex import transforms as T
														
 
															+
														
 
															+# 下载和解压蔬菜分类数据集
														
 
															+veg_dataset = 'https://bj.bcebos.com/paddlex/datasets/vegetables_cls.tar.gz'
														
 
															+pdx.utils.download_and_decompress(veg_dataset, path='./')
														
 
															+
														
 
															+# 定义训练和验证时的transforms
														
 
															+# API说明：https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/apis/transforms/transforms.md
														
 
															+train_transforms = T.Compose(
														
 
															+    [T.RandomCrop(crop_size=224), T.RandomHorizontalFlip(), T.Normalize()])
														
 
															+
														
 
															+eval_transforms = T.Compose([
														
 
															+    T.ResizeByShort(short_size=256), T.CenterCrop(crop_size=224), T.Normalize()
														
 
															+])
														
 
															+
														
 
															+# 定义训练和验证所用的数据集
														
 
															+# API说明：https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/apis/datasets.md
														
 
															+train_dataset = pdx.datasets.ImageNet(
														
 
															+    data_dir='vegetables_cls',
														
 
															+    file_list='vegetables_cls/train_list.txt',
														
 
															+    label_list='vegetables_cls/labels.txt',
														
 
															+    transforms=train_transforms,
														
 
															+    shuffle=True)
														
 
															+
														
 
															+eval_dataset = pdx.datasets.ImageNet(
														
 
															+    data_dir='vegetables_cls',
														
 
															+    file_list='vegetables_cls/val_list.txt',
														
 
															+    label_list='vegetables_cls/labels.txt',
														
 
															+    transforms=eval_transforms)
														
 
															+
														
 
															+# 初始化模型，并进行训练
														
 
															+# 可使用VisualDL查看训练指标，参考https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/visualdl.md
														
 
															+num_classes = len(train_dataset.labels)
														
 
															+model = pdx.cls.PPLCNet(num_classes=num_classes, scale=1)
														
 
															+
														
 
															+# API说明：https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/apis/models/classification.md
														
 
															+# 各参数介绍与调整说明：https://github.com/PaddlePaddle/PaddleX/tree/develop/docs/parameters.md
														
 
															+model.train(
														
 
															+    num_epochs=10,
														
 
															+    pretrain_weights='IMAGENET',
														
 
															+    train_dataset=train_dataset,
														
 
															+    train_batch_size=64,
														
 
															+    eval_dataset=eval_dataset,
														
 
															+    lr_decay_epochs=[4, 6, 8],
														
 
															+    learning_rate=0.1,
														
 
															+    save_dir='output/pplcnet',
														
 
															+    log_interval_steps=10,
														
 
															+    label_smoothing=.1,
														
 
															+    use_vdl=True)
														
--- a/tutorials/train/object_detection/picodet.py
+++ b/tutorials/train/object_detection/picodet.py
@@ -44,15 +44,16 @@ model = pdx.det.PicoDet(num_classes=num_classes, backbone='ESNet_l')
 
															 # API说明：https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/apis/models/detection.md
														
 
															 # 各参数介绍与调整说明：https://github.com/PaddlePaddle/PaddleX/blob/develop/docs/parameters.md
														
 
															 model.train(
														
 
															-    num_epochs=300,
														
 
															+    num_epochs=20,
														
 
															     train_dataset=train_dataset,
														
 
															-    train_batch_size=7,
														
 
															+    train_batch_size=14,
														
 
															     eval_dataset=eval_dataset,
														
 
															     pretrain_weights='COCO',
														
 
															     learning_rate=.05,
														
 
															-    warmup_steps=300,
														
 
															-    warmup_start_lr=0.0,
														
 
															-    save_interval_epochs=5,
														
 
															-    lr_decay_epochs=[85, 135],
														
 
															-    save_dir='output/piconet_esnet_l',
														
 
															+    warmup_steps=24,
														
 
															+    warmup_start_lr=0.005,
														
 
															+    save_interval_epochs=1,
														
 
															+    lr_decay_epochs=[6, 8, 11],
														
 
															+    use_ema=True,
														
 
															+    save_dir='output/picodet_esnet_l',
														
 
															     use_vdl=True)
	`@@ -1 +1 @@`
	`-Subproject commit d41b085d66946219351d8d99c2b3d95756489624`
			`+Subproject commit 692d732994660ceba82c75034c802eb1138239cf`