You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

matrix_mul.cpp 2.8 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. /**
  2. * \file dnn/test/cpu/matrix_mul.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  #include "test/cpu/fixture.h"

  #include <chrono>
  #include <cstdlib>
  #include <cstring>
  #include <vector>

  #include "test/common/benchmarker.h"
  #include "test/common/checker.h"
  #include "test/common/matrix_mul.h"
  16. using namespace megdnn;
  17. using namespace test;
  18. #if MEGDNN_WITH_BENCHMARK
  19. namespace {
  /**
   * \brief Straightforward single-precision matrix product C = A * B on
   *        strided row-major buffers.
   *
   * Every output row is first cleared to zero and then built up one k-step
   * at a time: element (m, k) of A scales row k of B, and the scaled row is
   * added onto row m of C.
   *
   * \param A        left operand, M rows of K floats
   * \param B        right operand, K rows of N floats
   * \param C        result, M rows of N floats; the first N floats of each row
   *                 are overwritten
   * \param M        number of rows of A and C
   * \param N        number of columns of B and C
   * \param K        number of columns of A / rows of B
   * \param Astride  distance in elements between consecutive rows of A
   * \param Bstride  distance in elements between consecutive rows of B
   * \param Cstride  distance in elements between consecutive rows of C
   */
  void sgemm_sgemv_like(const float* __restrict A, const float* __restrict B,
                        float* __restrict C, size_t M, size_t N, size_t K,
                        size_t Astride, size_t Bstride, size_t Cstride) {
      for (size_t row = 0; row != M; ++row) {
          const float* lhs_row = A + row * Astride;
          float* out_row = C + row * Cstride;

          // start every output row from zero before accumulating into it
          memset(out_row, 0, sizeof(float) * N);

          for (size_t depth = 0; depth != K; ++depth) {
              const float* rhs_row = B + depth * Bstride;
              for (size_t col = 0; col != N; ++col) {
                  out_row[col] += lhs_row[depth] * rhs_row[col];
              }
          }
      }
  }
  31. float benchmark_sgemm_sgemv_like(size_t M, size_t N, size_t K) {
  32. float *A = (float*)malloc(sizeof(float) * M * K),
  33. *B = (float*)malloc(sizeof(float) * K * N),
  34. *C = (float*)malloc(sizeof(float) * M * N);
  35. for (size_t i = 0; i < M * K; ++i)
  36. A[i] = (float)rand() / RAND_MAX;
  37. for (size_t i = 0; i < K * N; ++i)
  38. B[i] = (float)rand() / RAND_MAX;
  39. sgemm_sgemv_like(A, B, C, M, N, K, K, N, N);
  40. auto start = std::chrono::high_resolution_clock::now();
  41. for (size_t i = 0; i < 100; ++i) {
  42. sgemm_sgemv_like(A, B, C, M, N, K, K, N, N);
  43. }
  44. auto stop = std::chrono::high_resolution_clock::now();
  45. free(A);
  46. free(B);
  47. free(C);
  48. return std::chrono::duration_cast<std::chrono::milliseconds>(stop - start)
  49. .count();
  50. }
  51. } // namespace
  52. TEST_F(CPU, BENCHMARK_MATRIX_MUL) {
  53. Benchmarker<MatrixMul> benchmarker(handle());
  54. benchmarker.set_times(100);
  55. benchmarker.set_display(false);
  56. auto run = [&](size_t M, size_t N, size_t K) {
  57. std::cout << M << "x" << N << "x" << K << " ";
  58. auto time_in_ms_megdnn = benchmarker.exec({{M, K}, {K, N}, {}});
  59. auto time_in_ms_our = benchmark_sgemm_sgemv_like(M, N, K);
  60. std::cout << "megdnn=" << (int)time_in_ms_megdnn
  61. << " sgemv_like=" << time_in_ms_our << std::endl;
  62. };
  63. for (size_t m = 1; m <= 8; m *= 2)
  64. for (size_t nk = 128; nk <= 1024; nk *= 2) {
  65. run(m, nk, nk);
  66. }
  67. }
  68. #endif
  69. TEST_F(CPU, MATRIX_MUL) {
  70. matrix_mul::check_matrix_mul(dtype::Float32{}, dtype::Float32{},
  71. dtype::Float32{}, handle());
  72. }
  73. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台