You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

argmxx.cpp 3.2 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798
  1. #include "test/cuda/fixture.h"
  2. #include "megdnn/oprs.h"
  3. #include "test/common/checker.h"
  4. #include "test/common/rng.h"
  5. namespace {
  6. using namespace megdnn;
  7. using namespace test;
  8. class ArgmxxRNG final : public RNG {
  9. public:
  10. void gen(const TensorND& tensor) override {
  11. auto offset = tensor.layout.span().low_elem;
  12. auto nr_elems = tensor.layout.span().dist_elem();
  13. #define cb(DType) \
  14. if (tensor.layout.dtype == DType()) { \
  15. using ctype = typename DTypeTrait<DType>::ctype; \
  16. auto ptr = tensor.ptr<ctype>(); \
  17. for (size_t i = 0; i < nr_elems; ++i) { \
  18. ptr[offset + i] = i; \
  19. } \
  20. COMPAT_RANDOM(ptr + offset, ptr + offset + nr_elems); \
  21. }
  22. MEGDNN_FOREACH_COMPUTING_DTYPE(cb);
  23. #undef cb
  24. }
  25. };
  26. template <typename Argmxx>
  27. void test_argmxx(Handle* handle) {
  28. Checker<Argmxx> checker(handle);
  29. checker.set_dtype(1, dtype::Int32());
  30. using Param = typename Argmxx::Param;
  31. ArgmxxRNG rng;
  32. checker.set_rng(0, &rng);
  33. for (size_t axis = 0; axis < 4; ++axis) {
  34. Param param;
  35. param.axis = axis;
  36. checker.set_param(param)
  37. .set_dtype(0, dtype::Float32())
  38. .execs({{2, 3, 4, 5}, {}});
  39. checker.set_param(param)
  40. .set_dtype(0, dtype::Float16())
  41. .execs({{2, 3, 4, 5}, {}});
  42. checker.set_param(param).set_dtype(0, dtype::Int32()).execs({{2, 3, 4, 5}, {}});
  43. checker.set_param(param).set_dtype(0, dtype::Int16()).execs({{2, 3, 4, 5}, {}});
  44. checker.set_param(param).set_dtype(0, dtype::Int8()).execs({{2, 3, 4, 5}, {}});
  45. checker.set_param(param).set_dtype(0, dtype::Uint8()).execs({{2, 3, 4, 5}, {}});
  46. }
  47. checker.set_dtype(0, dtype::Float32());
  48. Param param;
  49. param.axis = 1;
  50. checker.set_param(param);
  51. // 1-step
  52. checker.execs({{2, 64, 32}, {}});
  53. // 2-step
  54. checker.execs({{2, 192, 32}, {}});
  55. // 3-step
  56. checker.execs({{2, 4333, 32}, {}});
  57. // single reduce
  58. checker.execs({{2, 1, 1}, {}});
  59. checker.execs({{2, 1 + 1, 1}, {}});
  60. checker.execs({{2, 2048 + 1, 1}, {}});
  61. checker.execs({{2, 2048 * 2048 + 1, 1}, {}});
  62. checker.execs({{2, 1 + 1, 31}, {}});
  63. checker.execs({{2, 16 + 1, 31}, {}});
  64. checker.execs({{2, 16 * 16 + 1, 31}, {}});
  65. checker.execs({{2, 16 * 16 * 16 + 1, 31}, {}});
  66. checker.execs({{2, 16 * 16 * 16 * 16 + 1, 31}, {}});
  67. checker.execs({{3, 256 * 256 + 1, 2}, {}});
  68. checker.execs({{3, 128 * 128 + 1, 3}, {}});
  69. checker.execs({{3, 64 * 64 + 1, 7}, {}});
  70. checker.execs({{3, 32 * 32 + 1, 15}, {}});
  71. checker.execs({{3, 512, 500}, {}});
  72. // very large reduce
  73. checker.execs({{1, 4194304, 1}, {}});
  74. }
  75. } // anonymous namespace
  76. namespace megdnn {
  77. namespace test {
  78. TEST_F(CUDA, ARGMAX) {
  79. test_argmxx<Argmax>(handle_cuda());
  80. }
  81. TEST_F(CUDA, ARGMIN) {
  82. test_argmxx<Argmin>(handle_cuda());
  83. }
  84. } // namespace test
  85. } // namespace megdnn
  86. // vim: syntax=cpp.doxygen