utils.cc 5.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160
  1. // Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved.
  2. //
  3. // Licensed under the Apache License, Version 2.0 (the "License");
  4. // you may not use this file except in compliance with the License.
  5. // You may obtain a copy of the License at
  6. //
  7. // http://www.apache.org/licenses/LICENSE-2.0
  8. //
  9. // Unless required by applicable law or agreed to in writing, software
  10. // distributed under the License is distributed on an "AS IS" BASIS,
  11. // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. // See the License for the specific language governing permissions and
  13. // limitations under the License.
  14. #include "ultra_infer/runtime/backends/tensorrt/utils.h"
  15. namespace ultra_infer {
  16. int ShapeRangeInfo::Update(const std::vector<int64_t> &new_shape) {
  17. if (new_shape.size() != shape.size()) {
  18. return -1;
  19. }
  20. int need_update_engine = 0;
  21. for (size_t i = 0; i < shape.size(); ++i) {
  22. if (is_static[i] == 1 && new_shape[i] != shape[i]) {
  23. return -1;
  24. }
  25. if (new_shape[i] < min[i] || min[i] < 0) {
  26. need_update_engine = 1;
  27. }
  28. if (new_shape[i] > max[i] || max[i] < 0) {
  29. need_update_engine = 1;
  30. }
  31. }
  32. if (need_update_engine == 0) {
  33. return 0;
  34. }
  35. FDWARNING << "[New Shape Out of Range] input name: " << name
  36. << ", shape: " << new_shape
  37. << ", The shape range before: min_shape=" << min
  38. << ", max_shape=" << max << "." << std::endl;
  39. for (size_t i = 0; i < shape.size(); ++i) {
  40. if (new_shape[i] < min[i] || min[i] < 0) {
  41. min[i] = new_shape[i];
  42. }
  43. if (new_shape[i] > max[i] || max[i] < 0) {
  44. max[i] = new_shape[i];
  45. }
  46. }
  47. FDWARNING
  48. << "[New Shape Out of Range] The updated shape range now: min_shape="
  49. << min << ", max_shape=" << max << "." << std::endl;
  50. return need_update_engine;
  51. }
  52. size_t TrtDataTypeSize(const nvinfer1::DataType &dtype) {
  53. if (dtype == nvinfer1::DataType::kFLOAT) {
  54. return sizeof(float);
  55. } else if (dtype == nvinfer1::DataType::kHALF) {
  56. return sizeof(float) / 2;
  57. } else if (dtype == nvinfer1::DataType::kINT8) {
  58. return sizeof(int8_t);
  59. } else if (dtype == nvinfer1::DataType::kINT32) {
  60. return sizeof(int32_t);
  61. }
  62. // kBOOL
  63. return sizeof(bool);
  64. }
  65. FDDataType GetFDDataType(const nvinfer1::DataType &dtype) {
  66. if (dtype == nvinfer1::DataType::kFLOAT) {
  67. return FDDataType::FP32;
  68. } else if (dtype == nvinfer1::DataType::kHALF) {
  69. return FDDataType::FP16;
  70. } else if (dtype == nvinfer1::DataType::kINT8) {
  71. return FDDataType::INT8;
  72. } else if (dtype == nvinfer1::DataType::kINT32) {
  73. return FDDataType::INT32;
  74. }
  75. // kBOOL
  76. return FDDataType::BOOL;
  77. }
  78. nvinfer1::DataType ReaderDtypeToTrtDtype(int reader_dtype) {
  79. if (reader_dtype == 0) {
  80. return nvinfer1::DataType::kFLOAT;
  81. } else if (reader_dtype == 1) {
  82. FDASSERT(false, "TensorRT cannot support data type of double now.");
  83. } else if (reader_dtype == 2) {
  84. FDASSERT(false, "TensorRT cannot support data type of uint8 now.");
  85. } else if (reader_dtype == 3) {
  86. return nvinfer1::DataType::kINT8;
  87. } else if (reader_dtype == 4) {
  88. return nvinfer1::DataType::kINT32;
  89. } else if (reader_dtype == 5) {
  90. // regard int64 as int32
  91. return nvinfer1::DataType::kINT32;
  92. } else if (reader_dtype == 6) {
  93. return nvinfer1::DataType::kHALF;
  94. }
  95. FDASSERT(false, "Received unexpected data type of %d", reader_dtype);
  96. return nvinfer1::DataType::kFLOAT;
  97. }
  98. FDDataType ReaderDtypeToFDDtype(int reader_dtype) {
  99. if (reader_dtype == 0) {
  100. return FDDataType::FP32;
  101. } else if (reader_dtype == 1) {
  102. return FDDataType::FP64;
  103. } else if (reader_dtype == 2) {
  104. return FDDataType::UINT8;
  105. } else if (reader_dtype == 3) {
  106. return FDDataType::INT8;
  107. } else if (reader_dtype == 4) {
  108. return FDDataType::INT32;
  109. } else if (reader_dtype == 5) {
  110. return FDDataType::INT64;
  111. } else if (reader_dtype == 6) {
  112. return FDDataType::FP16;
  113. }
  114. FDASSERT(false, "Received unexpected data type of %d", reader_dtype);
  115. return FDDataType::FP32;
  116. }
  117. std::vector<int> ToVec(const nvinfer1::Dims &dim) {
  118. std::vector<int> out(dim.d, dim.d + dim.nbDims);
  119. return out;
  120. }
  121. int64_t Volume(const nvinfer1::Dims &d) {
  122. return std::accumulate(d.d, d.d + d.nbDims, 1, std::multiplies<int64_t>());
  123. }
  124. nvinfer1::Dims ToDims(const std::vector<int> &vec) {
  125. int limit = static_cast<int>(nvinfer1::Dims::MAX_DIMS);
  126. if (static_cast<int>(vec.size()) > limit) {
  127. FDWARNING << "Vector too long, only first 8 elements are used in dimension."
  128. << std::endl;
  129. }
  130. // Pick first nvinfer1::Dims::MAX_DIMS elements
  131. nvinfer1::Dims dims{std::min(static_cast<int>(vec.size()), limit), {}};
  132. std::copy_n(vec.begin(), dims.nbDims, std::begin(dims.d));
  133. return dims;
  134. }
  135. nvinfer1::Dims ToDims(const std::vector<int64_t> &vec) {
  136. int limit = static_cast<int>(nvinfer1::Dims::MAX_DIMS);
  137. if (static_cast<int>(vec.size()) > limit) {
  138. FDWARNING << "Vector too long, only first 8 elements are used in dimension."
  139. << std::endl;
  140. }
  141. // Pick first nvinfer1::Dims::MAX_DIMS elements
  142. nvinfer1::Dims dims{std::min(static_cast<int>(vec.size()), limit), {}};
  143. std::copy_n(vec.begin(), dims.nbDims, std::begin(dims.d));
  144. return dims;
  145. }
  146. } // namespace ultra_infer