/** * \file dnn/test/cuda/warp_affine.cpp * MegEngine is Licensed under the Apache License, Version 2.0 (the "License") * * Copyright (c) 2014-2021 Megvii Inc. All rights reserved. * * Unless required by applicable law or agreed to in writing, * software distributed under the License is distributed on an * "AS IS" BASIS, WITHOUT ARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. */ #include "test/common/warp_affine.h" #include "include/megdnn/thin/small_vector.h" #include "test/common/benchmarker.h" #include "test/common/checker.h" #include "test/cuda/fixture.h" namespace megdnn { namespace test { // FIXME test WARP_PERSPECTIVE_CV failed here #if 0 TEST_F(CUDA, WARP_AFFINE_CV) { using namespace warp_affine; std::vector args = get_cv_args(); Checker checker(handle_cuda()); for (auto &&arg: args) { if (arg.src[3] == 2) continue; checker.set_param(arg.param) .set_epsilon(1 + 1e-3) .set_dtype(0, dtype::Uint8()) .set_dtype(1, dtype::Float32()) .set_dtype(2, dtype::Uint8()) .execs({arg.src, arg.trans, arg.dst}); } for (auto &&arg: args) { if (arg.src[3] == 2) continue; checker.set_param(arg.param) .set_dtype(0, dtype::Float32()) .set_dtype(1, dtype::Float32()) .set_dtype(2, dtype::Float32()) .execs({arg.src, arg.trans, arg.dst}); } } #endif TEST_F(CUDA, WARP_AFFINE) { //! NCHW for (auto dtype : std::vector{dtype::Float32()}) { for (auto bmode : {WarpAffine::BorderMode::WRAP, WarpAffine::BorderMode::REFLECT, WarpAffine::BorderMode::CONSTANT, WarpAffine::BorderMode::REPLICATE, WarpAffine::BorderMode::CONSTANT}) { Checker checker(handle_cuda()); NormalRNG rng; checker.set_rng(1, &rng); WarpAffine::Param param; param.border_val = 0.3f; param.border_mode = bmode; param.imode = param::WarpAffine::InterpolationMode::LINEAR; param.format = param::WarpAffine::Format::NCHW; checker.set_param(param); checker.set_dtype(0, dtype); checker.set_dtype(1, dtype); checker.set_dtype(2, dtype); checker.execs({{2, 3, 10, 11}, {2, 2, 3}, {2, 3, 11, 12}}); checker.execs({{22, 3, 10, 11}, {22, 2, 3}, {22, 3, 11, 12}}); } } //! NHWC for (auto dtype : std::vector{dtype::Float32()}) { for (auto bmode : {WarpAffine::BorderMode::WRAP, WarpAffine::BorderMode::REFLECT, WarpAffine::BorderMode::CONSTANT, WarpAffine::BorderMode::REPLICATE, WarpAffine::BorderMode::CONSTANT}) { Checker checker(handle_cuda()); NormalRNG rng; checker.set_rng(1, &rng); WarpAffine::Param param; param.format = param::WarpAffine::Format::NHWC; param.border_val = 0.3f; param.border_mode = bmode; param.imode = param::WarpAffine::InterpolationMode::LINEAR; checker.set_param(param); checker.set_dtype(0, dtype); checker.set_dtype(1, dtype); checker.set_dtype(2, dtype); checker.execs({{2, 3, 10, 11}, {2, 2, 3}, {2, 12, 11, 11}}); checker.execs({{22, 3, 10, 12}, {22, 2, 3}, {22, 3, 11, 12}}); } } } #if MEGDNN_WITH_BENCHMARK TEST_F(CUDA, WARP_AFFINE_BENCHMARK) { const size_t RUNS = 50; Benchmarker benchmark(handle_cuda()); benchmark.set_display(false); benchmark.set_times(RUNS); using Param = param::WarpAffine; Param param; auto run = [&benchmark, ¶m](TensorShape src, TensorShape mat, TensorShape dst) { benchmark.set_param(param); auto used = benchmark.execs({src, mat, dst}); printf("src: %s dst: %s used: %.2f ms %.2f Gflops\n", src.to_string().c_str(), dst.to_string().c_str(), used, //! 8 mul + 3 add 11 * dst.total_nr_elems() / (used / RUNS) / 1e6); }; run({1, 100, 100, 1}, {1, 2, 3}, {1, 112, 112, 1}); run({512, 100, 100, 1}, {512, 2, 3}, {512, 112, 112, 1}); } #endif } // namespace test } // namespace megdnn // vim: syntax=cpp.doxygen