You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

opr_impl.h 3.2 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108
  1. /**
  2. * \file dnn/src/arm_common/conv_bias/opr_impl.h
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
  10. * implied.
  11. */
  12. #pragma once
  13. #include "src/common/utils.h"
  14. #include "src/fallback/conv_bias/opr_impl.h"
  15. #include "src/common/algo_base.h"
  16. namespace megdnn {
  17. namespace arm_common {
  18. class ConvBiasImpl : public fallback::ConvBiasImpl {  // arm_common ConvBias operator; derives from the fallback implementation
  19. public:
  20. using fallback::ConvBiasImpl::ConvBiasImpl;  // inherit the base-class constructors unchanged
  21. bool is_thread_safe() const override { return true; }  // unconditionally reports true
  22. class AlgoBase : public fallback::ConvBiasImpl::AlgoBase {  // algorithm base for this backend; extends the fallback AlgoBase
  23. public:
  24. AlgoBase() : fallback::ConvBiasImpl::AlgoBase() {
  25. m_handle_type = Handle::HandleType::ARM_COMMON;  // tag every derived algorithm with the ARM_COMMON handle type
  26. }
  27. };
  28. SmallVector<fallback::ConvBiasImpl::AlgoBase*> get_all_packed_algo() override;  // declared here, defined out of line; NOTE(review): presumably lists the algorithms held by AlgoPack - confirm in the .cpp
  29. bool is_matmul_quantized_prefer(  // override taking the kernel-size parameters; body is not in this header
  30. const fallback::ConvBiasImpl::NCBKernSizeParam& ncb_param)
  31. const override;
  32. SmallVector<AlgoCategory> suggest_algo_category_order(  // override returning a list of AlgoCategory values; body is not in this header
  33. const NCBKernSizeParam& param) const override;
  34. MEGDNN_FB_DECL_GET_ALGO_FROM_DESC(ConvBiasImpl);  // macro defined elsewhere; NOTE(review): presumably declares a get-algo-from-descriptor member - confirm against the macro definition
  35. protected:
  36. const char* get_algorithm_set_name() const override;  // override returning a C string; body is not in this header
  37. private:  // everything below is a forward declaration only; the class definitions are not in this header
  38. class AlgoS8DirectStride1;
  39. class AlgoS8DirectStride2;
  40. class AlgoS8DirectNCHW44;
  41. class AlgoS8x8x16DirectNCHW44;
  42. class AlgoS8DirectNCHWNCHW44;
  43. class AlgoQU8DirectStride1;
  44. class AlgoQU8DirectStride2;
  45. class AlgoFP32WinogradF23_4x4;
  46. class AlgoFP32WinogradF63;
  47. class AlgoFP32WinogradF63_4x4;
  48. class AlgoFP32WinogradF54;
  49. class AlgoFP32WinogradF45;
  50. class AlgoFP32WinogradF23_4x4_NCHW44;
  51. class AlgoFP32WinogradF63_4x4_NCHW44;
  52. class AlgoFP32WinogradF73_4x4_NCHW44;
  53. class AlgoS8ChanWiseStride1NCHW44;
  54. class AlgoS8ChanWiseStride2NCHW44;
  55. class AlgoS8x8x16ChanWiseStride1Stride2NCHW44;
  56. #if __ARM_FEATURE_FP16_VECTOR_ARITHMETIC  // FP16 Winograd classes are declared only when this macro is non-zero
  57. class AlgoFP16WinogradF23;
  58. class AlgoFP16WinogradF45;
  59. class AlgoFP16WinogradF63;
  60. class AlgoFP16WinogradF23_8x8;
  61. #endif  // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
  62. #if MGB_ENABLE_DOT  // AlgoDot* classes are declared only when MGB_ENABLE_DOT is non-zero
  63. class AlgoDotS8DirectNCHWNCHW44;
  64. class AlgoDotS8DirectStride1;
  65. class AlgoDotS8DirectStride2;
  66. class AlgoDotU8DirectStride1;
  67. class AlgoDotU8DirectStride2;
  68. class AlgoDotS8Direct_NCHW44;
  69. #endif  // MGB_ENABLE_DOT
  70. class AlgoF32Direct;
  71. class AlgoF32DirectStride1;
  72. class AlgoF32DirectStride2;
  73. class AlgoF32DirectNCHWNCHW44;
  74. class AlgoF32ChannelWiseNCHW44;
  75. class AlgoF32DirectNCHW44;
  76. class AlgoI8x8x16Direct;
  77. class AlgoI8x8x16Stride2;
  78. class AlgoI8x8x16Stride2Filter2;
  79. class AlgoI8x8x16DirectNCHWNCHW44;
  80. class AlgoS8WinogradF23_8x8;
  81. class AlgoS8CF32WinogradF23_4x4_NCHW44;
  82. class AlgoS8WinogradF23_8x8_NCHW44;
  83. #if __ARM_FEATURE_FP16_VECTOR_ARITHMETIC  // second FP16-guarded group: the direct (non-Winograd) F16 classes
  84. class AlgoF16Direct;
  85. class AlgoF16DirectStride1;
  86. #endif  // __ARM_FEATURE_FP16_VECTOR_ARITHMETIC
  87. class AlgoPack;  // forward-declared; NOTE(review): presumably aggregates instances of the algorithms above - confirm in the .cpp
  88. static const AlgoPack& algo_pack();  // static accessor returning a const reference to an AlgoPack; defined out of line
  89. };
  90. } // namespace arm_common
  91. } // namespace megdnn
  92. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台