You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

network_visualize.py 6.7 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186
  1. #! /usr/bin/env python3
  2. # MegEngine is Licensed under the Apache License, Version 2.0 (the "License")
  3. #
  4. # Copyright (c) 2014-2021 Megvii Inc. All rights reserved.
  5. #
  6. # Unless required by applicable law or agreed to in writing,
  7. # software distributed under the License is distributed on an
  8. # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  9. import argparse
  10. import logging
  11. import numpy as np
  12. from megengine.core.tensor.dtype import is_quantize
  13. from megengine.logger import _imperative_rt_logger, get_logger, set_mgb_log_level
  14. from megengine.utils.module_stats import (
  15. print_flops_stats,
  16. print_params_stats,
  17. sizeof_fmt,
  18. )
  19. from megengine.utils.network import Network
  # Module-level logger, created by passing this module's __name__ to megengine.logger.get_logger.
  20. logger = get_logger(__name__)
  def visualize(
      model_path: str,
      log_path: str,
      bar_length_max: int = 20,
      log_params: bool = True,
      log_flops: bool = True,
  ):
      r"""
      Load megengine dumped model and visualize graph structure with tensorboard log files.
      Can also record and print model's statistics like :func:`~.module_stats`

      :param model_path: dir path for megengine dumped model.
      :param log_path: dir path for tensorboard graph log.
      :param bar_length_max: size of bar indicating max flops or parameter size in net stats.
      :param log_params: whether print and record params size.
      :param log_flops: whether print and record op flops.
      :return: ``(total_params, total_flops)``. Each entry is ``0`` when the
          matching ``log_*`` flag is false, otherwise the value returned by
          ``print_params_stats`` / ``print_flops_stats``. Returns ``None`` when
          the tensorboard / tensorboardX imports fail.
      """
      # The tensorboard stack is imported lazily so that the module itself can
      # be imported without it; a missing package is logged, not raised.
      try:
          from tensorboard.compat.proto.attr_value_pb2 import AttrValue
          from tensorboard.compat.proto.config_pb2 import RunMetadata
          from tensorboard.compat.proto.graph_pb2 import GraphDef
          from tensorboard.compat.proto.node_def_pb2 import NodeDef
          from tensorboard.compat.proto.step_stats_pb2 import (
              AllocatorMemoryUsed,
              DeviceStepStats,
              NodeExecStats,
              StepStats,
          )
          from tensorboard.compat.proto.tensor_shape_pb2 import TensorShapeProto
          from tensorboard.compat.proto.versions_pb2 import VersionDef
          from tensorboardX import SummaryWriter
      except ImportError:
          logger.error(
              "TensorBoard and TensorboardX are required for visualize.", exc_info=True
          )
          return

      def process_name(name):
          # Dots become slashes in the encoded node name written to the graph.
          return name.replace(".", "/").encode(encoding="utf-8")

      # FIXME: remove this after resolving "span dist too large" warning
      old_level = set_mgb_log_level(logging.ERROR)
      writer = None
      try:
          graph = Network.load(model_path)
          writer = SummaryWriter(log_path)

          node_list = []
          flops_list = []
          params_list = []
          for node in graph.all_oprs:
              if hasattr(node, "output_idx"):
                  node_oup = node.outputs[node.output_idx]
              else:
                  if len(node.outputs) != 1:
                      logger.warning(
                          "OpNode {} has more than one output and not has 'output_idx' attr.".format(
                              node
                          )
                      )
                  node_oup = node.outputs[0]

              inp_list = [process_name(var.owner.name) for var in node.inputs]
              attr = {
                  "_output_shapes": AttrValue(
                      list=AttrValue.ListValue(
                          shape=[
                              TensorShapeProto(
                                  dim=[
                                      TensorShapeProto.Dim(size=d)
                                      for d in node_oup.shape
                                  ]
                              )
                          ]
                      )
                  ),
              }

              if hasattr(node, "calc_flops"):
                  flops_num = node.calc_flops()
                  # add op flops attr
                  attr["flops"] = AttrValue(
                      s=sizeof_fmt(flops_num).encode(encoding="utf-8")
                  )
                  flops_list.append(
                      dict(
                          name=node.name,
                          class_name=node.type,
                          input_shapes=[i.shape for i in node.inputs],
                          output_shapes=[o.shape for o in node.outputs],
                          flops_num=flops_num,
                          flops_cum=0,
                      )
                  )

              if node.type == "ImmutableTensor":
                  param_dim = np.prod(node_oup.shape)
                  # TODO: consider other quantize dtypes
                  param_bytes = 1 if is_quantize(node_oup.dtype) else 4
                  param_size = param_dim * param_bytes
                  # add tensor size attr
                  attr["size"] = AttrValue(
                      s=sizeof_fmt(param_size).encode(encoding="utf-8")
                  )
                  # Fetch the tensor value once and reuse it for both statistics.
                  values = node.numpy()
                  params_list.append(
                      dict(
                          name=node.name,
                          shape=node_oup.shape,
                          param_dim=param_dim,
                          bits=param_bytes * 8,
                          size=param_size,
                          size_cum=0,
                          mean="{:.2g}".format(values.mean()),
                          std="{:.2g}".format(values.std()),
                      )
                  )

              # FIXME(MGE-2165): nodes outside network module may lead to unknown display bug
              if len(node.name.split(".")) <= 2 and node not in graph.input_vars:
                  continue
              node_list.append(
                  NodeDef(
                      name=process_name(node.name),
                      op=node.type,
                      input=inp_list,
                      attr=attr,
                  )
              )

          total_flops, total_params = 0, 0
          if log_params:
              total_params = print_params_stats(params_list, bar_length_max)
          if log_flops:
              total_flops = print_flops_stats(flops_list, bar_length_max)

          graph_def = GraphDef(node=node_list, versions=VersionDef(producer=22))
          device = "/device:CPU:0"
          stepstats = RunMetadata(
              step_stats=StepStats(dev_stats=[DeviceStepStats(device=device)])
          )
          writer._get_file_writer().add_graph((graph_def, stepstats))

          return total_params, total_flops
      finally:
          # Restore the log level even when loading or graph building fails, so
          # a failed call does not leave the process-wide level stuck at ERROR.
          # FIXME: remove this after resolving "span dist too large" warning
          _imperative_rt_logger.set_log_level(old_level)
          # Close the writer so the graph event is flushed and the file handle
          # is released.
          if writer is not None:
              writer.close()
  def main():
      """Command-line entry point: parse the arguments and forward them to ``visualize``.

      Every parsed option is passed to ``visualize`` as a keyword argument, so
      the option names must match its parameter names.
      """
      cli = argparse.ArgumentParser(
          formatter_class=argparse.ArgumentDefaultsHelpFormatter,
          description="load a megengine dumped model and export log file for tensorboard visualization.",
      )

      # Required positional paths, registered in the order they appear on the CLI.
      positionals = (
          ("model_path", "dumped model path."),
          ("log_path", "tensorboard log path."),
      )
      for dest, text in positionals:
          cli.add_argument(dest, help=text)

      cli.add_argument(
          "--bar_length_max",
          default=20,
          type=int,
          help="size of bar indicating max flops or parameter size in net stats.",
      )

      # Boolean switches: absent means False, present means True.
      switches = (
          ("--log_params", "whether print and record params size."),
          ("--log_flops", "whether print and record op flops."),
      )
      for flag, text in switches:
          cli.add_argument(flag, action="store_true", help=text)

      options = cli.parse_args()
      visualize(**vars(options))


  if __name__ == "__main__":
      main()

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台