You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

extra_impl_helper.h 1.7 kB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253
  1. #pragma once
  2. #include "megdnn/basic_types.h"
  3. #include "megdnn/handle.h"
  4. #include "megdnn/oprs/general.h"
  5. #include "test/common/opr_proxy.h"
  6. namespace megdnn {
  7. namespace test {
  8. template <typename Opr, int NR_OUTPUTS = 1, typename Proxy = OprProxy<Opr>>
  9. std::function<void(const TensorNDArray&)> extra_impl_helper(
  10. Handle* h, const typename Opr::Param& p) {
  11. auto impl = [](const TensorNDArray& tensors, Handle* h,
  12. const typename Opr::Param& p) {
  13. static_assert(
  14. NR_OUTPUTS <= OprTrait<Opr>::arity,
  15. "OutNumber should less than or equal to arity.");
  16. Proxy proxy;
  17. auto fp32_opr = h->create_operator<Opr>();
  18. auto type_cvt = h->create_operator<TypeCvt>();
  19. fp32_opr->param() = p;
  20. TensorNDArray fp32_tensors;
  21. for (size_t i = 0; i < tensors.size(); ++i) {
  22. auto layout = tensors[i].layout;
  23. layout.dtype = dtype::Float32();
  24. fp32_tensors.emplace_back(malloc(layout.span().dist_byte()), layout);
  25. type_cvt->exec(tensors[i], fp32_tensors[i]);
  26. }
  27. proxy.exec(fp32_opr.get(), fp32_tensors);
  28. for (size_t i = fp32_tensors.size() - NR_OUTPUTS; i < fp32_tensors.size();
  29. ++i) {
  30. type_cvt->exec(fp32_tensors[i], tensors[i]);
  31. }
  32. for (size_t i = 0; i < tensors.size(); ++i) {
  33. free(fp32_tensors[i].raw_ptr());
  34. }
  35. };
  36. return std::bind(impl, std::placeholders::_1, h, std::cref(p));
  37. }
  38. template <>
  39. std::function<void(const TensorNDArray&)> extra_impl_helper<AddUpdate>(
  40. Handle* h, const AddUpdate::Param& p);
  41. } // namespace test
  42. } // namespace megdnn
  43. // vim: syntax=cpp.doxygen