om_backend.h
// Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#pragma once

#include <cstring>
#include <iostream>
#include <memory>
#include <string>
#include <vector>

#include "acl/acl.h"
#include "ultra_infer/core/fd_tensor.h"
#include "ultra_infer/runtime/backends/backend.h"
namespace ultra_infer {

class OmBackend : public BaseBackend {
 public:
  OmBackend() = default;
  virtual ~OmBackend();

  // OM Backend implementation.
  bool Init(const RuntimeOption &runtime_option) override;

  int NumInputs() const override {
    return static_cast<int>(inputs_desc_.size());
  }

  int NumOutputs() const override {
    return static_cast<int>(outputs_desc_.size());
  }

  TensorInfo GetInputInfo(int index) override;
  TensorInfo GetOutputInfo(int index) override;
  std::vector<TensorInfo> GetInputInfos() override;
  std::vector<TensorInfo> GetOutputInfos() override;
  bool Infer(std::vector<FDTensor> &inputs, std::vector<FDTensor> *outputs,
             bool copy_to_fd = true) override;

  // Tracks whether ACL has already been initialized.
  static bool aclInitFlag;

 private:
  std::vector<TensorInfo> inputs_desc_;
  std::vector<TensorInfo> outputs_desc_;
  std::vector<void *> inputBuffer;
  std::vector<void *> outputBuffer;

  bool loadFlag_ = false;   // model load flag
  int32_t deviceId_;        // NPU device id
  uint32_t modelId_;        // id assigned by ACL when the model is loaded
  size_t modelWorkSize_;    // model work memory buffer size
  size_t modelWeightSize_;  // model weight memory buffer size
  void *modelWorkPtr_;      // model work memory buffer
  void *modelWeightPtr_;    // model weight memory buffer
  aclmdlDesc *modelDesc_;   // model description (input/output metadata)
  aclmdlDataset *input_;    // dataset holding input device buffers
  aclmdlDataset *output_;   // dataset holding output device buffers
  aclrtContext context_;
  aclrtStream stream_;

  bool LoadModel(const char *modelPath);
  bool Execute();
  bool CreateInput();
  void DestroyInput();
  bool CreateOutput();
  void DestroyOutput();
  void DestroyResource();
  bool CreateModelDesc();
  void FreeInputBuffer();
  void FreeOutputBuffer();
  bool InitResource();
};

}  // namespace ultra_infer
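For orientation, the private helpers follow the usual Ascend ACL offline-model flow. The sketch below shows how LoadModel could size and allocate the work/weight buffers and load an .om file using the standard ACL calls (aclmdlQuerySize, aclrtMalloc, aclmdlLoadFromFileWithMem); it is an illustrative assumption, not the actual implementation in om_backend.cc.

// Illustrative sketch only -- assumes the standard ACL loading sequence;
// the real implementation may differ.
bool OmBackend::LoadModel(const char *modelPath) {
  if (loadFlag_) {
    std::cerr << "Model has already been loaded." << std::endl;
    return false;
  }
  // Query how much device memory the model needs for work and weights.
  aclError ret =
      aclmdlQuerySize(modelPath, &modelWorkSize_, &modelWeightSize_);
  if (ret != ACL_SUCCESS) {
    std::cerr << "Query model size failed, errorCode = " << ret << std::endl;
    return false;
  }
  // Allocate the work and weight buffers on the device.
  ret = aclrtMalloc(&modelWorkPtr_, modelWorkSize_, ACL_MEM_MALLOC_HUGE_FIRST);
  if (ret != ACL_SUCCESS) {
    std::cerr << "Malloc work buffer failed, errorCode = " << ret << std::endl;
    return false;
  }
  ret = aclrtMalloc(&modelWeightPtr_, modelWeightSize_,
                    ACL_MEM_MALLOC_HUGE_FIRST);
  if (ret != ACL_SUCCESS) {
    std::cerr << "Malloc weight buffer failed, errorCode = " << ret
              << std::endl;
    return false;
  }
  // Load the offline (.om) model into the buffers; modelId_ identifies it
  // in later execution calls.
  ret = aclmdlLoadFromFileWithMem(modelPath, &modelId_, modelWorkPtr_,
                                  modelWorkSize_, modelWeightPtr_,
                                  modelWeightSize_);
  if (ret != ACL_SUCCESS) {
    std::cerr << "Load model from file failed, errorCode = " << ret
              << std::endl;
    return false;
  }
  loadFlag_ = true;
  return true;
}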