You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

python_c_extension.cpp 10 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313
  1. /**
  2. * \file imperative/tablegen/targets/python_c_extension.cpp
  3. * MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  4. *
  5. * Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  6. *
  7. * Unless required by applicable law or agreed to in writing,
  8. * software distributed under the License is distributed on an
  9. * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. */
  11. #include "python_c_extension.h"
  12. #include "../emitter.h"
  13. namespace mlir::tblgen {
  14. namespace {
  15. struct Initproc {
  16. std::string func;
  17. Initproc(std::string&& s): func(std::move(s)) {}
  18. std::string operator()(std::string argument) {
  19. return formatv("{0}({1})", func, argument);
  20. }
  21. };
  22. class OpDefEmitter: public EmitterBase {
  23. public:
  24. OpDefEmitter(MgbOp& op_, raw_ostream& os_, Environment& env_):
  25. EmitterBase(os_, env_), op(op_) {
  26. ctx.withSelf(op.getCppClassName());
  27. }
  28. Initproc emit();
  29. private:
  30. void emit_class();
  31. void emit_py_init();
  32. void emit_py_getsetters();
  33. Initproc emit_initproc();
  34. MgbOp& op;
  35. std::vector<Initproc> subclasses;
  36. mlir::tblgen::FmtContext ctx;
  37. };
  38. class EnumAttrEmitter: public EmitterBase {
  39. public:
  40. EnumAttrEmitter(llvm::StringRef parent, MgbEnumAttr* attr_, raw_ostream& os_, Environment& env_):
  41. EmitterBase(os_, env_), attr(attr_) {
  42. unsigned int enumID;
  43. if (auto alias = llvm::dyn_cast<MgbAliasAttr>(attr)) {
  44. auto&& aliasBase = alias->getAliasBase();
  45. enumID = llvm::cast<MgbEnumAttr>(aliasBase).getBaseRecord()->getID();
  46. } else {
  47. enumID = attr->getBaseRecord()->getID();
  48. }
  49. ctx.addSubst("enumTpl", attr->getEnumCombinedFlag() ? "BitCombinedEnumWrapper" : "EnumWrapper");
  50. ctx.addSubst("opClass", parent);
  51. ctx.addSubst("enumClass", attr->getEnumName());
  52. firstOccur = env().enumAlias.emplace(enumID, std::make_pair(parent, attr->getEnumName())).second;
  53. }
  54. Initproc emit();
  55. protected:
  56. void emit_tpl_spl();
  57. Initproc emit_initproc();
  58. MgbEnumAttr* attr;
  59. bool firstOccur;
  60. mlir::tblgen::FmtContext ctx;
  61. };
  62. Initproc EnumAttrEmitter::emit() {
  63. emit_tpl_spl();
  64. return emit_initproc();
  65. }
  66. void EnumAttrEmitter::emit_tpl_spl() {
  67. if (!firstOccur) return;
  68. os << tgfmt(
  69. "template<> PyTypeObject $enumTpl<$opClass::$enumClass>::type={};\n",
  70. &ctx);
  71. os << tgfmt(
  72. "template<> const char* $enumTpl<$opClass::$enumClass>::name = "
  73. "\"$opClass.$enumClass\";\n",
  74. &ctx);
  75. if (attr->getEnumCombinedFlag()) {
  76. os << tgfmt(
  77. "template<> PyNumberMethods "
  78. "$enumTpl<$opClass::$enumClass>::number_methods={};\n",
  79. &ctx);
  80. os << tgfmt(
  81. "template<> struct EnumTrait<$opClass::$enumClass> { static constexpr "
  82. "bool is_bit_combined = true;};\n",
  83. &ctx);
  84. }
  85. auto str2type = [&](auto&& i) -> std::string {
  86. return tgfmt("{normalize_enum(\"$0\"), $opClass::$enumClass::$0}", &ctx, i);
  87. };
  88. os << tgfmt(R"(
  89. template<> std::unordered_map<std::string, $opClass::$enumClass>
  90. $enumTpl<$opClass::$enumClass>::str2type = {$0};
  91. )", &ctx, llvm::join(llvm::map_range(attr->getEnumMembers(), str2type), ", "));
  92. auto type2str = [&](auto&& i) -> std::string {
  93. return tgfmt("{$opClass::$enumClass::$0, normalize_enum(\"$0\")}", &ctx, i);
  94. };
  95. os << tgfmt(R"(
  96. template<> std::unordered_map<$opClass::$enumClass, std::string>
  97. $enumTpl<$opClass::$enumClass>::type2str = {$0};
  98. )", &ctx, llvm::join(llvm::map_range(attr->getEnumMembers(), type2str), ", "));
  99. }
  100. Initproc EnumAttrEmitter::emit_initproc() {
  101. std::string initproc = formatv("_init_py_{0}_{1}",
  102. ctx.getSubstFor("opClass"), ctx.getSubstFor("enumClass"));
  103. os << tgfmt(R"(
  104. void $0(PyTypeObject& py_type) {
  105. auto& e_type = $enumTpl<$opClass::$enumClass>::type;
  106. )", &ctx, initproc);
  107. if (firstOccur) {
  108. os << tgfmt(R"(
  109. e_type = {PyVarObject_HEAD_INIT(NULL, 0)};
  110. e_type.tp_name = "megengine.core._imperative_rt.ops.$opClass.$enumClass";
  111. e_type.tp_basicsize = sizeof($enumTpl<$opClass::$enumClass>);
  112. e_type.tp_flags = Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE;
  113. e_type.tp_doc = "$opClass.$enumClass";
  114. e_type.tp_base = &PyBaseObject_Type;
  115. e_type.tp_repr = $enumTpl<$opClass::$enumClass>::py_repr;
  116. e_type.tp_richcompare = $enumTpl<$opClass::$enumClass>::tp_richcompare;
  117. )", &ctx);
  118. if (attr->getEnumCombinedFlag()) {
  119. // only bit combined enum could new instance because bitwise operation,
  120. // others should always use singleton
  121. os << tgfmt(R"(
  122. e_type.tp_new = $enumTpl<$opClass::$enumClass>::py_new_combined_enum;
  123. e_type.tp_init = $enumTpl<$opClass::$enumClass>::py_init;
  124. auto& number_method = $enumTpl<$opClass::$enumClass>::number_methods;
  125. number_method.nb_or = $enumTpl<$opClass::$enumClass>::py_or;
  126. number_method.nb_and = $enumTpl<$opClass::$enumClass>::py_and;
  127. e_type.tp_as_number = &number_method;
  128. )", &ctx);
  129. }
  130. os << " mgb_assert(PyType_Ready(&e_type) >= 0);\n";
  131. for (auto&& i : attr->getEnumMembers()) {
  132. os << tgfmt(R"({
  133. PyObject* inst = e_type.tp_alloc(&e_type, 0);
  134. reinterpret_cast<$enumTpl<$opClass::$enumClass>*>(inst)->value = $opClass::$enumClass::$0;
  135. mgb_assert(PyDict_SetItemString(e_type.tp_dict, "$0", inst) >= 0);
  136. PyType_Modified(&e_type);
  137. })", &ctx, i);
  138. }
  139. }
  140. os << tgfmt(R"(
  141. mgb_assert(PyDict_SetItemString(
  142. py_type.tp_dict, "$enumClass", reinterpret_cast<PyObject*>(&e_type)) >= 0);
  143. )", &ctx);
  144. os << "}\n";
  145. return initproc;
  146. }
  147. Initproc OpDefEmitter::emit() {
  148. for (auto&& i : op.getMgbAttributes()) {
  149. if (auto attr = llvm::dyn_cast<MgbEnumAttr>(&i.attr)) {
  150. subclasses.push_back(EnumAttrEmitter(op.getCppClassName(), attr, os, env()).emit());
  151. }
  152. }
  153. emit_class();
  154. emit_py_init();
  155. emit_py_getsetters();
  156. return emit_initproc();
  157. }
  158. void OpDefEmitter::emit_class() {
  159. os << tgfmt(R"(
  160. PyOpDefBegin($_self) // {
  161. static PyGetSetDef py_getsetters[];
  162. static int py_init(PyObject *self, PyObject *args, PyObject *kwds);
  163. // };
  164. PyOpDefEnd($_self)
  165. )", &ctx);
  166. }
  167. void OpDefEmitter::emit_py_init() {
  168. std::string initBody;
  169. if (!op.getMgbAttributes().empty()) {
  170. initBody += "static const char* kwlist[] = {";
  171. std::vector<llvm::StringRef> attr_name_list;
  172. llvm::for_each(op.getMgbAttributes(), [&](auto&& attr) {
  173. attr_name_list.push_back(attr.name);
  174. });
  175. attr_name_list.push_back("scope");
  176. llvm::for_each(attr_name_list, [&](auto&& attr) {
  177. initBody += formatv("\"{0}\", ", attr);
  178. });
  179. initBody += "NULL};\n";
  180. initBody += " PyObject ";
  181. auto initializer = [&](auto&& attr) -> std::string {
  182. return formatv("*{0} = NULL", attr);
  183. };
  184. initBody += llvm::join(llvm::map_range(attr_name_list, initializer), ", ") + ";\n";
  185. initBody += " if (!PyArg_ParseTupleAndKeywords(args, kwds, \"|";
  186. // an extra slot created for name
  187. initBody += std::string(attr_name_list.size(), 'O');
  188. initBody += "\", const_cast<char**>(kwlist)";
  189. llvm::for_each(attr_name_list, [&](auto&& attr) {
  190. initBody += formatv(", &{0}", attr);
  191. });
  192. initBody += "))\n";
  193. initBody += " return -1;\n";
  194. llvm::for_each(op.getMgbAttributes(), [&](auto&& attr) {
  195. initBody += tgfmt(R"(
  196. if ($0) {
  197. try {
  198. reinterpret_cast<PyOp($_self)*>(self)->inst().$0 =
  199. pyobj_convert_generic<decltype($_self::$0)>::from($0);
  200. } CATCH_ALL(-1)
  201. }
  202. )", &ctx, attr.name);
  203. });
  204. initBody += tgfmt(R"(
  205. if (scope) {
  206. try {
  207. reinterpret_cast<PyOp(OpDef)*>(self)->op
  208. ->set_scope(pyobj_convert_generic<std::string>::from(scope));
  209. } CATCH_ALL(-1)
  210. }
  211. )", &ctx);
  212. }
  213. initBody += "\n return 0;";
  214. os << tgfmt(R"(
  215. int PyOp($_self)::py_init(PyObject *self, PyObject *args, PyObject *kwds) {
  216. $0
  217. }
  218. )", &ctx, initBody);
  219. }
  220. void OpDefEmitter::emit_py_getsetters() {
  221. auto f = [&](auto&& attr) -> std::string {
  222. return tgfmt(
  223. "{const_cast<char*>(\"$0\"), py_get_generic($_self, $0), py_set_generic($_self, $0), const_cast<char*>(\"$0\"), NULL},",
  224. &ctx, attr.name);
  225. };
  226. os << tgfmt(R"(
  227. PyGetSetDef PyOp($_self)::py_getsetters[] = {
  228. $0
  229. {NULL} /* Sentinel */
  230. };
  231. )", &ctx, llvm::join(llvm::map_range(op.getMgbAttributes(), f), "\n "));
  232. }
  233. Initproc OpDefEmitter::emit_initproc() {
  234. std::string initproc = formatv("_init_py_{0}", op.getCppClassName());
  235. std::string subclass_init_call;
  236. for (auto&& i : subclasses) {
  237. subclass_init_call += formatv(" {0};\n", i("py_type"));
  238. }
  239. os << tgfmt(R"(
  240. void $0(py::module m) {
  241. using py_op = PyOp($_self);
  242. auto& py_type = PyOpType($_self);
  243. py_type = {PyVarObject_HEAD_INIT(NULL, 0)};
  244. py_type.tp_name = "megengine.core._imperative_rt.ops.$_self";
  245. py_type.tp_basicsize = sizeof(PyOp($_self));
  246. py_type.tp_flags = Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE;
  247. py_type.tp_doc = "$_self";
  248. py_type.tp_base = &PyOpType(OpDef);
  249. py_type.tp_dealloc = py_dealloc_generic<py_op>;
  250. py_type.tp_new = py_new_generic<py_op>;
  251. py_type.tp_init = py_op::py_init;
  252. py_type.tp_getset = py_op::py_getsetters;
  253. mgb_assert(PyType_Ready(&py_type) >= 0);
  254. $1
  255. PyType_Modified(&py_type);
  256. m.add_object("$_self", reinterpret_cast<PyObject*>(&py_type));
  257. mgb_assert(PyOp(OpDef)::ctype2pytype.emplace($_self::typeinfo(), &py_type).second);
  258. }
  259. )", &ctx, initproc, subclass_init_call);
  260. return initproc;
  261. }
  262. } // namespace
  263. bool gen_op_def_python_c_extension(raw_ostream &os, llvm::RecordKeeper &keeper) {
  264. Environment env;
  265. using namespace std::placeholders;
  266. std::vector<Initproc> initprocs;
  267. foreach_operator(keeper, [&](MgbOp& op) {
  268. initprocs.emplace_back(OpDefEmitter(op, os, env).emit());
  269. });
  270. os << "#define INIT_ALL_OP(m)";
  271. for(auto&& init : initprocs) {
  272. os << formatv(" \\\n {0};", init("m"));
  273. }
  274. os << "\n";
  275. return false;
  276. }
  277. } // namespace mlir::tblgen

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台