You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

algos.h 8.8 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. /**
  2. * \file dnn/src/arm_common/conv_bias/int8/algos.h
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
  10. * implied.
  11. */
  12. #pragma once
  13. #include "src/arm_common/conv_bias/opr_impl.h"
  14. namespace megdnn {
  15. namespace arm_common {
  16. class ConvBiasImpl::AlgoS8DirectStride1 final : public AlgoBase {
  17. bool m_large_group;
  18. public:
  19. AlgoS8DirectStride1(bool large_group) : m_large_group(large_group) {}
  20. bool is_reproducible() const override { return true; }
  21. const char* name() const override {
  22. return m_large_group ? "S8STRD1_LARGE_GROUP" : "S8STRD1_SMALL_GROUP";
  23. }
  24. bool usable(const NCBKernSizeParam& param,
  25. AlgoSelectionStrategy algo_selection_strategy) const override;
  26. size_t get_workspace(const NCBKernSizeParam& param) const override;
  27. virtual SmallVector<NCBKern> dispatch_kerns(
  28. const NCBKernSizeParam& param) const override;
  29. bool is_preferred(const NCBKernSizeParam& param) const override;
  30. };
  31. class ConvBiasImpl::AlgoS8DirectStride2 final : public AlgoBase {
  32. bool m_large_group;
  33. public:
  34. AlgoS8DirectStride2(bool large_group) : m_large_group(large_group) {}
  35. bool is_reproducible() const override { return true; }
  36. const char* name() const override {
  37. return m_large_group ? "S8STRD2_LARGE_GROUP" : "S8STRD2_SMALL_GROUP";
  38. }
  39. bool usable(const NCBKernSizeParam& param,
  40. AlgoSelectionStrategy algo_selection_strategy) const override;
  41. size_t get_workspace(const NCBKernSizeParam& param) const override;
  42. virtual SmallVector<NCBKern> dispatch_kerns(
  43. const NCBKernSizeParam& param) const override;
  44. };
  45. class ConvBiasImpl::AlgoS8DirectNCHW44 final : public AlgoBase {
  46. public:
  47. AlgoS8DirectNCHW44() {}
  48. bool is_reproducible() const override { return true; }
  49. const char* name() const override { return "S8_NCHW44_DIRECT"; }
  50. bool usable(const NCBKernSizeParam& param,
  51. AlgoSelectionStrategy algo_selection_strategy) const override;
  52. size_t get_workspace(const NCBKernSizeParam& param) const override;
  53. virtual SmallVector<NCBKern> dispatch_kerns(
  54. const NCBKernSizeParam& param) const override;
  55. bool is_preferred(const NCBKernSizeParam& param) const override;
  56. };
  57. class ConvBiasImpl::AlgoS8DirectNCHWNCHW44 final : public AlgoBase {
  58. public:
  59. AlgoS8DirectNCHWNCHW44() {}
  60. bool is_reproducible() const override { return true; }
  61. const char* name() const override { return "S8_CONV_NCHW_NCHW44"; }
  62. bool usable(const NCBKernSizeParam& param,
  63. AlgoSelectionStrategy algo_selection_strategy) const override;
  64. size_t get_workspace(const NCBKernSizeParam& param) const override;
  65. virtual SmallVector<NCBKern> dispatch_kerns(
  66. const NCBKernSizeParam& param) const override;
  67. bool is_preferred(const NCBKernSizeParam& param) const override;
  68. };
  69. class ConvBiasImpl::AlgoS8ChanWiseStride1NCHW44 final : public AlgoBase {
  70. public:
  71. bool is_reproducible() const override { return true; }
  72. const char* name() const override { return "S8_CHAN_WISE_STRD1_NCHW44"; }
  73. bool usable(const NCBKernSizeParam& param,
  74. AlgoSelectionStrategy algo_selection_strategy) const override;
  75. size_t get_workspace(const NCBKernSizeParam& param) const override;
  76. virtual SmallVector<NCBKern> dispatch_kerns(
  77. const NCBKernSizeParam& param) const override;
  78. };
  79. class ConvBiasImpl::AlgoS8ChanWiseStride2NCHW44 final : public AlgoBase {
  80. public:
  81. bool is_reproducible() const override { return true; }
  82. const char* name() const override { return "S8_CHAN_WISE_STRD2_NCHW44"; }
  83. bool usable(const NCBKernSizeParam& param,
  84. AlgoSelectionStrategy algo_selection_strategy) const override;
  85. size_t get_workspace(const NCBKernSizeParam& param) const override;
  86. virtual SmallVector<NCBKern> dispatch_kerns(
  87. const NCBKernSizeParam& param) const override;
  88. };
  89. #if __ARM_FEATURE_DOTPROD
  90. class ConvBiasImpl::AlgoDotS8DirectNCHWNCHW44 final : public AlgoBase {
  91. public:
  92. bool is_reproducible() const override { return true; }
  93. const char* name() const override { return "ARMDOTS8_NCHW_NCHW44"; }
  94. bool usable(const NCBKernSizeParam&,
  95. AlgoSelectionStrategy algo_selection_strategy) const override;
  96. size_t get_workspace(const NCBKernSizeParam&) const override;
  97. virtual SmallVector<NCBKern> dispatch_kerns(
  98. const NCBKernSizeParam& param) const override;
  99. };
  100. class ConvBiasImpl::AlgoDotS8DirectStride1 final : public AlgoBase {
  101. bool m_large_group;
  102. public:
  103. AlgoDotS8DirectStride1(bool large_group) : m_large_group(large_group) {}
  104. bool is_reproducible() const override { return true; }
  105. const char* name() const override {
  106. return m_large_group ? "ARMDOTS8STRD1_LARGE_GROUP"
  107. : "ARMDOTS8STRD1_SMALL_GROUP";
  108. }
  109. bool usable(const NCBKernSizeParam&,
  110. AlgoSelectionStrategy algo_selection_strategy) const override;
  111. size_t get_workspace(const NCBKernSizeParam&) const override;
  112. virtual SmallVector<NCBKern> dispatch_kerns(
  113. const NCBKernSizeParam& param) const override;
  114. };
  115. class ConvBiasImpl::AlgoDotS8DirectStride2 final : public AlgoBase {
  116. bool m_large_group;
  117. public:
  118. AlgoDotS8DirectStride2(bool large_group) : m_large_group(large_group) {}
  119. bool is_reproducible() const override { return true; }
  120. const char* name() const override {
  121. return m_large_group ? "ARMDOTS8STRD2_LARGE_GROUP"
  122. : "ARMDOTS8STRD2_SMALL_GROUP";
  123. }
  124. bool usable(const NCBKernSizeParam&,
  125. AlgoSelectionStrategy algo_selection_strategy) const override;
  126. size_t get_workspace(const NCBKernSizeParam&) const override;
  127. virtual SmallVector<NCBKern> dispatch_kerns(
  128. const NCBKernSizeParam& param) const override;
  129. };
  130. class ConvBiasImpl::AlgoDotS8Direct_NCHW44 final : public AlgoBase {
  131. public:
  132. AlgoDotS8Direct_NCHW44() {}
  133. bool is_reproducible() const override { return true; }
  134. const char* name() const override { return "ARMDOTS8DIRECT_NCHW44"; }
  135. bool usable(const NCBKernSizeParam&,
  136. AlgoSelectionStrategy algo_selection_strategy) const override;
  137. size_t get_workspace(const NCBKernSizeParam&) const override;
  138. SmallVector<NCBKern> dispatch_kerns(
  139. const NCBKernSizeParam& param) const override;
  140. bool is_preferred(const NCBKernSizeParam& param) const override;
  141. };
  142. #endif
  143. class ConvBiasImpl::AlgoS8WinogradF23_8x8 final : public AlgoBase {
  144. public:
  145. AlgoS8WinogradF23_8x8(fallback::MatrixMulImpl::AlgoBase* matmul_algo,
  146. uint32_t tile_size)
  147. : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
  148. const char* name() const override {
  149. if (m_name.empty()) {
  150. m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
  151. m_matmul_algo->name(), {8, 2, m_tile_size});
  152. }
  153. return m_name.c_str();
  154. }
  155. MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
  156. };
  157. //=======================input int8 compute fp32 output int8============
  158. class ConvBiasImpl::AlgoS8CF32WinogradF23_4x4_NCHW44 final : public AlgoBase {
  159. public:
  160. AlgoS8CF32WinogradF23_4x4_NCHW44(
  161. fallback::MatrixMulImpl::AlgoBase* matmul_algo, uint32_t tile_size)
  162. : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
  163. const char* name() const override {
  164. if (m_name.empty()) {
  165. m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
  166. m_matmul_algo->name(), {4, 2, m_tile_size},
  167. param::ConvBias::Format::NCHW44);
  168. }
  169. return m_name.c_str();
  170. }
  171. MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
  172. };
  173. //=======================input int8 compute int16 output int8============
  174. class ConvBiasImpl::AlgoS8WinogradF23_8x8_NCHW44 final : public AlgoBase {
  175. public:
  176. AlgoS8WinogradF23_8x8_NCHW44(fallback::MatrixMulImpl::AlgoBase* matmul_algo,
  177. uint32_t tile_size)
  178. : m_matmul_algo{matmul_algo}, m_tile_size{tile_size} {}
  179. const char* name() const override {
  180. if (m_name.empty()) {
  181. m_name = ConvBiasImpl::algo_name<ConvBias::WinogradParam>(
  182. m_matmul_algo->name(), {8, 2, m_tile_size},
  183. param::ConvBias::Format::NCHW44);
  184. }
  185. return m_name.c_str();
  186. }
  187. MEGDNN_WINOGRAD_ALGO_FUN_DECLARE();
  188. };
  189. } // namespace arm_common
  190. } // namespace megdnn
  191. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台