You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

matrix_mul.cpp 2.8 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879
  1. /**
  2. * \file dnn/test/cpu/matrix_mul.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2020 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
#include "test/cpu/fixture.h"

#include <algorithm>
#include <chrono>
#include <cstddef>
#include <cstdlib>
#include <vector>

#include "test/common/benchmarker.h"
#include "test/common/checker.h"
#include "test/common/matrix_mul.h"
  16. using namespace megdnn;
  17. using namespace test;
  18. namespace {
  19. void sgemm_sgemv_like(const float* __restrict A, const float* __restrict B,
  20. float* __restrict C, size_t M, size_t N, size_t K,
  21. size_t Astride, size_t Bstride, size_t Cstride) {
  22. for (size_t m = 0; m < M; ++m) {
  23. memset(C + m * Cstride, 0, sizeof(float) * N);
  24. for (size_t k = 0; k < K; ++k)
  25. for (size_t n = 0; n < N; ++n) {
  26. C[m * Cstride + n] += A[m * Astride + k] * B[k * Bstride + n];
  27. }
  28. }
  29. }
  30. float benchmark_sgemm_sgemv_like(size_t M, size_t N, size_t K) {
  31. float *A = (float*)malloc(sizeof(float) * M * K),
  32. *B = (float*)malloc(sizeof(float) * K * N),
  33. *C = (float*)malloc(sizeof(float) * M * N);
  34. for (size_t i = 0; i < M * K; ++i)
  35. A[i] = (float)rand() / RAND_MAX;
  36. for (size_t i = 0; i < K * N; ++i)
  37. B[i] = (float)rand() / RAND_MAX;
  38. sgemm_sgemv_like(A, B, C, M, N, K, K, N, N);
  39. auto start = std::chrono::high_resolution_clock::now();
  40. for (size_t i = 0; i < 100; ++i) {
  41. sgemm_sgemv_like(A, B, C, M, N, K, K, N, N);
  42. }
  43. auto stop = std::chrono::high_resolution_clock::now();
  44. free(A);
  45. free(B);
  46. free(C);
  47. return std::chrono::duration_cast<std::chrono::milliseconds>(stop - start)
  48. .count();
  49. }
  50. } // namespace
  51. TEST_F(CPU, BENCHMARK_MATRIX_MUL) {
  52. Benchmarker<MatrixMul> benchmarker(handle());
  53. benchmarker.set_times(100);
  54. benchmarker.set_display(false);
  55. auto run = [&](size_t M, size_t N, size_t K) {
  56. std::cout << M << "x" << N << "x" << K << " ";
  57. auto time_in_ms_megdnn = benchmarker.exec({{M, K}, {K, N}, {}});
  58. auto time_in_ms_our = benchmark_sgemm_sgemv_like(M, N, K);
  59. std::cout << "megdnn=" << (int)time_in_ms_megdnn
  60. << " sgemv_like=" << time_in_ms_our << std::endl;
  61. };
  62. for (size_t m = 1; m <= 8; m *= 2)
  63. for (size_t nk = 128; nk <= 1024; nk *= 2) {
  64. run(m, nk, nk);
  65. }
  66. }
  67. TEST_F(CPU, MATRIX_MUL) {
  68. matrix_mul::check_matrix_mul(dtype::Float32{}, dtype::Float32{},
  69. dtype::Float32{}, handle());
  70. }
  71. // vim: syntax=cpp.doxygen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台

Contributors (1)