// Repository: zhengchun/PaddleX
// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include "ultra_infer/pybind/main.h"

namespace ultra_infer {
void BindPPDet(pybind11::module &m) {
  pybind11::class_<vision::detection::PaddleDetPreprocessor,
                   vision::ProcessorManager>(m, "PaddleDetPreprocessor")
      .def(pybind11::init<std::string>())
      .def("run",
           [](vision::detection::PaddleDetPreprocessor &self,
              std::vector<pybind11::array> &im_list) {
             std::vector<vision::FDMat> images;
             for (size_t i = 0; i < im_list.size(); ++i) {
               images.push_back(vision::WrapMat(PyArrayToCvMat(im_list[i])));
             }
             std::vector<FDTensor> outputs;
             if (!self.Run(&images, &outputs)) {
               throw std::runtime_error(
                   "Failed to preprocess the input data in "
                   "PaddleDetPreprocessor.");
             }
             for (size_t i = 0; i < outputs.size(); ++i) {
               outputs[i].StopSharing();
             }
             return outputs;
           })
      .def("disable_normalize",
           [](vision::detection::PaddleDetPreprocessor &self) {
             self.DisableNormalize();
           })
      .def("disable_permute",
           [](vision::detection::PaddleDetPreprocessor &self) {
             self.DisablePermute();
           });

  pybind11::class_<vision::detection::NMSOption>(m, "NMSOption")
      .def(pybind11::init())
      .def_readwrite("background_label",
                     &vision::detection::NMSOption::background_label)
      .def_readwrite("keep_top_k", &vision::detection::NMSOption::keep_top_k)
      .def_readwrite("nms_eta", &vision::detection::NMSOption::nms_eta)
      .def_readwrite("nms_threshold",
                     &vision::detection::NMSOption::nms_threshold)
      .def_readwrite("nms_top_k", &vision::detection::NMSOption::nms_top_k)
      .def_readwrite("normalized", &vision::detection::NMSOption::normalized)
      .def_readwrite("score_threshold",
                     &vision::detection::NMSOption::score_threshold);

  pybind11::class_<vision::detection::PaddleDetPostprocessor>(
      m, "PaddleDetPostprocessor")
      .def(pybind11::init<>())
      .def(pybind11::init<std::string>())
      .def("run",
           [](vision::detection::PaddleDetPostprocessor &self,
              std::vector<FDTensor> &inputs) {
             std::vector<vision::DetectionResult> results;
             if (!self.Run(inputs, &results)) {
               throw std::runtime_error(
                   "Failed to postprocess the runtime result in "
                   "PaddleDetPostprocessor.");
             }
             return results;
           })
      .def("set_nms_option",
           [](vision::detection::PaddleDetPostprocessor &self,
              vision::detection::NMSOption option) {
             self.SetNMSOption(option);
           })
      .def("set_nms_rotated_option",
           [](vision::detection::PaddleDetPostprocessor &self,
              vision::detection::NMSRotatedOption option) {
             self.SetNMSRotatedOption(option);
           })
      .def("apply_nms",
           [](vision::detection::PaddleDetPostprocessor &self) {
             self.ApplyNMS();
           })
      .def("run", [](vision::detection::PaddleDetPostprocessor &self,
                     std::vector<pybind11::array> &input_array) {
        std::vector<vision::DetectionResult> results;
        std::vector<FDTensor> inputs;
        PyArrayToTensorList(input_array, &inputs, /*share_buffer=*/true);
        if (!self.Run(inputs, &results)) {
          throw std::runtime_error(
              "Failed to postprocess the runtime result in "
              "PaddleDetPostprocessor.");
        }
        return results;
      });

  pybind11::class_<vision::detection::PPDetBase, UltraInferModel>(m,
                                                                  "PPDetBase")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>())
      .def("predict",
           [](vision::detection::PPDetBase &self, pybind11::array &data) {
             auto mat = PyArrayToCvMat(data);
             vision::DetectionResult res;
             self.Predict(&mat, &res);
             return res;
           })
      .def("batch_predict",
           [](vision::detection::PPDetBase &self,
              std::vector<pybind11::array> &data) {
             std::vector<cv::Mat> images;
             for (size_t i = 0; i < data.size(); ++i) {
               images.push_back(PyArrayToCvMat(data[i]));
             }
             std::vector<vision::DetectionResult> results;
             self.BatchPredict(images, &results);
             return results;
           })
      .def("clone",
           [](vision::detection::PPDetBase &self) { return self.Clone(); })
      .def_property_readonly("preprocessor",
                             &vision::detection::PPDetBase::GetPreprocessor)
      .def_property_readonly("postprocessor",
                             &vision::detection::PPDetBase::GetPostprocessor);

  pybind11::class_<vision::detection::PPYOLO, vision::detection::PPDetBase>(
      m, "PPYOLO")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PPYOLOE, vision::detection::PPDetBase>(
      m, "PPYOLOE")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PicoDet, vision::detection::PPDetBase>(
      m, "PicoDet")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleYOLOX,
                   vision::detection::PPDetBase>(m, "PaddleYOLOX")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::FasterRCNN, vision::detection::PPDetBase>(
      m, "FasterRCNN")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::YOLOv3, vision::detection::PPDetBase>(
      m, "YOLOv3")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::MaskRCNN, vision::detection::PPDetBase>(
      m, "MaskRCNN")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::SSD, vision::detection::PPDetBase>(m,
                                                                         "SSD")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleYOLOv5,
                   vision::detection::PPDetBase>(m, "PaddleYOLOv5")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleYOLOv6,
                   vision::detection::PPDetBase>(m, "PaddleYOLOv6")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleYOLOv7,
                   vision::detection::PPDetBase>(m, "PaddleYOLOv7")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleYOLOv8,
                   vision::detection::PPDetBase>(m, "PaddleYOLOv8")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::RTMDet, vision::detection::PPDetBase>(
      m, "RTMDet")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::CascadeRCNN,
                   vision::detection::PPDetBase>(m, "CascadeRCNN")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PSSDet, vision::detection::PPDetBase>(
      m, "PSSDet")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::RetinaNet, vision::detection::PPDetBase>(
      m, "RetinaNet")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PPYOLOESOD, vision::detection::PPDetBase>(
      m, "PPYOLOESOD")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::FCOS, vision::detection::PPDetBase>(
      m, "FCOS")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::TTFNet, vision::detection::PPDetBase>(
      m, "TTFNet")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::TOOD, vision::detection::PPDetBase>(
      m, "TOOD")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::GFL, vision::detection::PPDetBase>(m,
                                                                         "GFL")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::SOLOv2, vision::detection::PPDetBase>(
      m, "SOLOv2")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PaddleDetectionModel,
                   vision::detection::PPDetBase>(m, "PaddleDetectionModel")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::PPYOLOER, vision::detection::PPDetBase>(
      m, "PPYOLOER")
      .def(pybind11::init<std::string, std::string, std::string, RuntimeOption,
                          ModelFormat>());

  pybind11::class_<vision::detection::NMSRotatedOption>(m, "NMSRotatedOption")
      .def(pybind11::init())
      .def_readwrite("background_label",
                     &vision::detection::NMSRotatedOption::background_label)
      .def_readwrite("keep_top_k",
                     &vision::detection::NMSRotatedOption::keep_top_k)
      .def_readwrite("nms_eta", &vision::detection::NMSRotatedOption::nms_eta)
      .def_readwrite("nms_threshold",
                     &vision::detection::NMSRotatedOption::nms_threshold)
      .def_readwrite("nms_top_k",
                     &vision::detection::NMSRotatedOption::nms_top_k)
      .def_readwrite("normalized",
                     &vision::detection::NMSRotatedOption::normalized)
      .def_readwrite("score_threshold",
                     &vision::detection::NMSRotatedOption::score_threshold);
}
} // namespace ultra_infer