|
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502 |
-
-
- <!DOCTYPE html>
- <!--[if IE 8]><html class="no-js lt-ie9" lang="en" > <![endif]-->
- <!--[if gt IE 8]><!--> <html class="no-js" lang="en" > <!--<![endif]-->
- <head>
- <meta charset="utf-8">
-
- <meta name="viewport" content="width=device-width, initial-scale=1.0">
-
- <title>pygraph.utils.graphdataset — py-graph documentation</title>
-
-
-
-
-
-
-
-
- <script type="text/javascript" src="../../../_static/js/modernizr.min.js"></script>
-
-
- <script type="text/javascript" id="documentation_options" data-url_root="../../../" src="../../../_static/documentation_options.js"></script>
- <script type="text/javascript" src="../../../_static/jquery.js"></script>
- <script type="text/javascript" src="../../../_static/underscore.js"></script>
- <script type="text/javascript" src="../../../_static/doctools.js"></script>
- <script async="async" type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.1/MathJax.js?config=TeX-AMS-MML_HTMLorMML"></script>
-
- <script type="text/javascript" src="../../../_static/js/theme.js"></script>
-
-
-
-
- <link rel="stylesheet" href="../../../_static/css/theme.css" type="text/css" />
- <link rel="stylesheet" href="../../../_static/pygments.css" type="text/css" />
- <link rel="index" title="Index" href="../../../genindex.html" />
- <link rel="search" title="Search" href="../../../search.html" />
- </head>
-
- <body class="wy-body-for-nav">
-
-
- <div class="wy-grid-for-nav">
-
- <nav data-toggle="wy-nav-shift" class="wy-nav-side">
- <div class="wy-side-scroll">
- <div class="wy-side-nav-search" >
-
-
-
- <a href="../../../index.html" class="icon icon-home"> py-graph
-
-
-
- </a>
-
-
-
-
- <div class="version">
- 1.0
- </div>
-
-
-
-
- <div role="search">
- <form id="rtd-search-form" class="wy-form" action="../../../search.html" method="get">
- <input type="text" name="q" placeholder="Search docs" />
- <input type="hidden" name="check_keywords" value="yes" />
- <input type="hidden" name="area" value="default" />
- </form>
- </div>
-
-
- </div>
-
- <div class="wy-menu wy-menu-vertical" data-spy="affix" role="navigation" aria-label="main navigation">
-
-
-
-
-
-
- <!-- Local TOC -->
- <div class="local-toc"></div>
-
-
- </div>
- </div>
- </nav>
-
- <section data-toggle="wy-nav-shift" class="wy-nav-content-wrap">
-
-
- <nav class="wy-nav-top" aria-label="top navigation">
-
- <i data-toggle="wy-nav-top" class="fa fa-bars"></i>
- <a href="../../../index.html">py-graph</a>
-
- </nav>
-
-
- <div class="wy-nav-content">
-
- <div class="rst-content">
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- <div role="navigation" aria-label="breadcrumbs navigation">
-
- <ul class="wy-breadcrumbs">
-
- <li><a href="../../../index.html">Docs</a> »</li>
-
- <li><a href="../../index.html">Module code</a> »</li>
-
- <li>pygraph.utils.graphdataset</li>
-
-
- <li class="wy-breadcrumbs-aside">
-
- </li>
-
- </ul>
-
-
- <hr/>
- </div>
- <div role="main" class="document" itemscope="itemscope" itemtype="http://schema.org/Article">
- <div itemprop="articleBody">
-
- <h1>Source code for pygraph.utils.graphdataset</h1><div class="highlight"><pre>
- <span></span><span class="sd">""" Obtain all kinds of attributes of a graph dataset.</span>
- <span class="sd">"""</span>
-
-
- <div class="viewcode-block" id="get_dataset_attributes"><a class="viewcode-back" href="../../../pygraph.utils.html#pygraph.utils.graphdataset.get_dataset_attributes">[docs]</a><span class="k">def</span> <span class="nf">get_dataset_attributes</span><span class="p">(</span><span class="n">Gn</span><span class="p">,</span>
- <span class="n">target</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span>
- <span class="n">attr_names</span><span class="o">=</span><span class="p">[],</span>
- <span class="n">node_label</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span>
- <span class="n">edge_label</span><span class="o">=</span><span class="kc">None</span><span class="p">):</span>
- <span class="sd">"""Returns the structure and property information of the graph dataset Gn.</span>
-
- <span class="sd"> Parameters</span>
- <span class="sd"> ----------</span>
- <span class="sd"> Gn : List of NetworkX graphs</span>
- <span class="sd"> List of graphs whose information will be returned.</span>
- <span class="sd"> target : list</span>
- <span class="sd"> The list of classification targets corresponding to Gn. Only works for </span>
- <span class="sd"> classification problems.</span>
- <span class="sd"> attr_names : list</span>
- <span class="sd"> List of strings indicating which information will be returned. The</span>
- <span class="sd"> possible choices include:</span>
- <span class="sd"> 'substructures': sub-structures Gn contains, including 'linear', 'non </span>
- <span class="sd"> linear' and 'cyclic'.</span>
- <span class="sd"> 'node_labeled': whether vertices have symbolic labels.</span>
- <span class="sd"> 'edge_labeled': whether edges have symbolic labels.</span>
- <span class="sd"> 'is_directed': whether graphs in Gn are directed.</span>
- <span class="sd"> 'dataset_size': number of graphs in Gn.</span>
- <span class="sd"> 'ave_node_num': average number of vertices of graphs in Gn.</span>
- <span class="sd"> 'min_node_num': minimum number of vertices of graphs in Gn.</span>
- <span class="sd"> 'max_node_num': maximum number of vertices of graphs in Gn.</span>
- <span class="sd"> 'ave_edge_num': average number of edges of graphs in Gn.</span>
- <span class="sd"> 'min_edge_num': minimum number of edges of graphs in Gn.</span>
- <span class="sd"> 'max_edge_num': maximum number of edges of graphs in Gn.</span>
- <span class="sd"> 'ave_node_degree': average vertex degree of graphs in Gn.</span>
- <span class="sd"> 'min_node_degree': minimum vertex degree of graphs in Gn.</span>
- <span class="sd"> 'max_node_degree': maximum vertex degree of graphs in Gn.</span>
- <span class="sd"> 'ave_fill_factor': average fill factor (number_of_edges / </span>
- <span class="sd"> (number_of_nodes ** 2)) of graphs in Gn.</span>
- <span class="sd"> 'min_fill_factor': minimum fill factor of graphs in Gn.</span>
- <span class="sd"> 'max_fill_factor': maximum fill factor of graphs in Gn.</span>
- <span class="sd"> 'node_label_num': number of symbolic vertex labels.</span>
- <span class="sd"> 'edge_label_num': number of symbolic edge labels.</span>
- <span class="sd"> 'node_attr_dim': number of dimensions of non-symbolic vertex labels. </span>
- <span class="sd"> Extracted from the 'attributes' attribute of graph nodes.</span>
- <span class="sd"> 'edge_attr_dim': number of dimensions of non-symbolic edge labels.</span>
- <span class="sd"> Extracted from the 'attributes' attribute of graph edges.</span>
- <span class="sd"> 'class_number': number of classes. Only available for classification </span>
- <span class="sd"> problems.</span>
- <span class="sd"> node_label : string</span>
- <span class="sd"> Node attribute used as label. The default node label is atom. Mandatory</span>
- <span class="sd"> when 'node_labeled' or 'node_label_num' is required.</span>
- <span class="sd"> edge_label : string</span>
- <span class="sd"> Edge attribute used as label. The default edge label is bond_type. </span>
- <span class="sd"> Mandatory when 'edge_labeled' or 'edge_label_num' is required.</span>
-
- <span class="sd"> Return</span>
- <span class="sd"> ------</span>
- <span class="sd"> attrs : dict</span>
- <span class="sd"> Value for each property.</span>
- <span class="sd"> """</span>
- <span class="kn">import</span> <span class="nn">networkx</span> <span class="k">as</span> <span class="nn">nx</span>
- <span class="kn">import</span> <span class="nn">numpy</span> <span class="k">as</span> <span class="nn">np</span>
-
- <span class="n">attrs</span> <span class="o">=</span> <span class="p">{}</span>
-
- <span class="k">def</span> <span class="nf">get_dataset_size</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_all_node_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="p">[</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">]</span>
-
- <span class="k">def</span> <span class="nf">get_ave_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_min_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amin</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_max_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amax</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_all_edge_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="p">[</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_edges</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">]</span>
-
- <span class="k">def</span> <span class="nf">get_ave_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_min_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amin</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">get_max_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amax</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">is_node_labeled</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="kc">False</span> <span class="k">if</span> <span class="n">node_label</span> <span class="ow">is</span> <span class="kc">None</span> <span class="k">else</span> <span class="kc">True</span>
-
- <span class="k">def</span> <span class="nf">get_node_label_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="n">nl</span> <span class="o">=</span> <span class="nb">set</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="n">nl</span> <span class="o">=</span> <span class="n">nl</span> <span class="o">|</span> <span class="nb">set</span><span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">get_node_attributes</span><span class="p">(</span><span class="n">G</span><span class="p">,</span> <span class="n">node_label</span><span class="p">)</span><span class="o">.</span><span class="n">values</span><span class="p">())</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="n">nl</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">is_edge_labeled</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="kc">False</span> <span class="k">if</span> <span class="n">edge_label</span> <span class="ow">is</span> <span class="kc">None</span> <span class="k">else</span> <span class="kc">True</span>
-
- <span class="k">def</span> <span class="nf">get_edge_label_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="n">el</span> <span class="o">=</span> <span class="nb">set</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="n">el</span> <span class="o">=</span> <span class="n">el</span> <span class="o">|</span> <span class="nb">set</span><span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">get_edge_attributes</span><span class="p">(</span><span class="n">G</span><span class="p">,</span> <span class="n">edge_label</span><span class="p">)</span><span class="o">.</span><span class="n">values</span><span class="p">())</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="n">el</span><span class="p">)</span>
-
- <span class="k">def</span> <span class="nf">is_directed</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">nx</span><span class="o">.</span><span class="n">is_directed</span><span class="p">(</span><span class="n">Gn</span><span class="p">[</span><span class="mi">0</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_ave_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">([</span><span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="nb">list</span><span class="p">(</span><span class="nb">dict</span><span class="p">(</span><span class="n">G</span><span class="o">.</span><span class="n">degree</span><span class="p">())</span><span class="o">.</span><span class="n">values</span><span class="p">()))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_max_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amax</span><span class="p">([</span><span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="nb">list</span><span class="p">(</span><span class="nb">dict</span><span class="p">(</span><span class="n">G</span><span class="o">.</span><span class="n">degree</span><span class="p">())</span><span class="o">.</span><span class="n">values</span><span class="p">()))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_min_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amin</span><span class="p">([</span><span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="nb">list</span><span class="p">(</span><span class="nb">dict</span><span class="p">(</span><span class="n">G</span><span class="o">.</span><span class="n">degree</span><span class="p">())</span><span class="o">.</span><span class="n">values</span><span class="p">()))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="c1"># get fill factor: number of edges divided by the squared number of nodes (the size of the adjacency matrix).</span>
- <span class="k">def</span> <span class="nf">get_ave_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">([</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_edges</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="o">/</span> <span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">)</span>
- <span class="o">*</span> <span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_max_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amax</span><span class="p">([</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_edges</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="o">/</span> <span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">)</span>
- <span class="o">*</span> <span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_min_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">return</span> <span class="n">np</span><span class="o">.</span><span class="n">amin</span><span class="p">([</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_edges</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="o">/</span> <span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">)</span>
- <span class="o">*</span> <span class="n">nx</span><span class="o">.</span><span class="n">number_of_nodes</span><span class="p">(</span><span class="n">G</span><span class="p">))</span> <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">])</span>
-
- <span class="k">def</span> <span class="nf">get_substructures</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="n">subs</span> <span class="o">=</span> <span class="nb">set</span><span class="p">()</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="n">degrees</span> <span class="o">=</span> <span class="nb">list</span><span class="p">(</span><span class="nb">dict</span><span class="p">(</span><span class="n">G</span><span class="o">.</span><span class="n">degree</span><span class="p">())</span><span class="o">.</span><span class="n">values</span><span class="p">())</span>
- <span class="k">if</span> <span class="nb">any</span><span class="p">(</span><span class="n">i</span> <span class="o">==</span> <span class="mi">2</span> <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span> <span class="n">degrees</span><span class="p">):</span>
- <span class="n">subs</span><span class="o">.</span><span class="n">add</span><span class="p">(</span><span class="s1">'linear'</span><span class="p">)</span>
- <span class="k">if</span> <span class="n">np</span><span class="o">.</span><span class="n">amax</span><span class="p">(</span><span class="n">degrees</span><span class="p">)</span> <span class="o">>=</span> <span class="mi">3</span><span class="p">:</span>
- <span class="n">subs</span><span class="o">.</span><span class="n">add</span><span class="p">(</span><span class="s1">'non linear'</span><span class="p">)</span>
- <span class="k">if</span> <span class="s1">'linear'</span> <span class="ow">in</span> <span class="n">subs</span> <span class="ow">and</span> <span class="s1">'non linear'</span> <span class="ow">in</span> <span class="n">subs</span><span class="p">:</span>
- <span class="k">break</span>
-
- <span class="k">if</span> <span class="n">is_directed</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="k">if</span> <span class="nb">len</span><span class="p">(</span><span class="nb">list</span><span class="p">(</span><span class="n">nx</span><span class="o">.</span><span class="n">find_cycle</span><span class="p">(</span><span class="n">G</span><span class="p">)))</span> <span class="o">></span> <span class="mi">0</span><span class="p">:</span>
- <span class="n">subs</span><span class="o">.</span><span class="n">add</span><span class="p">(</span><span class="s1">'cyclic'</span><span class="p">)</span>
- <span class="k">break</span>
- <span class="c1"># else:</span>
- <span class="c1"># # @todo: this method does not work for big graph with large amount of edges like D&D, try a better way.</span>
- <span class="c1"># upper = np.amin([nx.number_of_edges(G) for G in Gn]) * 2 + 10</span>
- <span class="c1"># for G in Gn:</span>
- <span class="c1"># if (nx.number_of_edges(G) < upper):</span>
- <span class="c1"># cyc = list(nx.simple_cycles(G.to_directed()))</span>
- <span class="c1"># if any(len(i) > 2 for i in cyc):</span>
- <span class="c1"># subs.add('cyclic')</span>
- <span class="c1"># break</span>
- <span class="c1"># if 'cyclic' not in subs:</span>
- <span class="c1"># for G in Gn:</span>
- <span class="c1"># cyc = list(nx.simple_cycles(G.to_directed()))</span>
- <span class="c1"># if any(len(i) > 2 for i in cyc):</span>
- <span class="c1"># subs.add('cyclic')</span>
- <span class="c1"># break</span>
-
- <span class="k">return</span> <span class="n">subs</span>
-
- <span class="k">def</span> <span class="nf">get_class_num</span><span class="p">(</span><span class="n">target</span><span class="p">):</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="nb">set</span><span class="p">(</span><span class="n">target</span><span class="p">))</span>
-
- <span class="k">def</span> <span class="nf">get_node_attr_dim</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="k">for</span> <span class="n">n</span> <span class="ow">in</span> <span class="n">G</span><span class="o">.</span><span class="n">nodes</span><span class="p">(</span><span class="n">data</span><span class="o">=</span><span class="kc">True</span><span class="p">):</span>
- <span class="k">if</span> <span class="s1">'attributes'</span> <span class="ow">in</span> <span class="n">n</span><span class="p">[</span><span class="mi">1</span><span class="p">]:</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="n">n</span><span class="p">[</span><span class="mi">1</span><span class="p">][</span><span class="s1">'attributes'</span><span class="p">])</span>
- <span class="k">return</span> <span class="mi">0</span>
-
- <span class="k">def</span> <span class="nf">get_edge_attr_dim</span><span class="p">(</span><span class="n">Gn</span><span class="p">):</span>
- <span class="k">for</span> <span class="n">G</span> <span class="ow">in</span> <span class="n">Gn</span><span class="p">:</span>
- <span class="k">if</span> <span class="n">nx</span><span class="o">.</span><span class="n">number_of_edges</span><span class="p">(</span><span class="n">G</span><span class="p">)</span> <span class="o">></span> <span class="mi">0</span><span class="p">:</span>
- <span class="k">for</span> <span class="n">e</span> <span class="ow">in</span> <span class="n">G</span><span class="o">.</span><span class="n">edges</span><span class="p">(</span><span class="n">data</span><span class="o">=</span><span class="kc">True</span><span class="p">):</span>
- <span class="k">if</span> <span class="s1">'attributes'</span> <span class="ow">in</span> <span class="n">e</span><span class="p">[</span><span class="mi">2</span><span class="p">]:</span>
- <span class="k">return</span> <span class="nb">len</span><span class="p">(</span><span class="n">e</span><span class="p">[</span><span class="mi">2</span><span class="p">][</span><span class="s1">'attributes'</span><span class="p">])</span>
- <span class="k">return</span> <span class="mi">0</span>
-
- <span class="k">if</span> <span class="n">attr_names</span> <span class="o">==</span> <span class="p">[]:</span>
- <span class="n">attr_names</span> <span class="o">=</span> <span class="p">[</span>
- <span class="s1">'substructures'</span><span class="p">,</span>
- <span class="s1">'node_labeled'</span><span class="p">,</span>
- <span class="s1">'edge_labeled'</span><span class="p">,</span>
- <span class="s1">'is_directed'</span><span class="p">,</span>
- <span class="s1">'dataset_size'</span><span class="p">,</span>
- <span class="s1">'ave_node_num'</span><span class="p">,</span>
- <span class="s1">'min_node_num'</span><span class="p">,</span>
- <span class="s1">'max_node_num'</span><span class="p">,</span>
- <span class="s1">'ave_edge_num'</span><span class="p">,</span>
- <span class="s1">'min_edge_num'</span><span class="p">,</span>
- <span class="s1">'max_edge_num'</span><span class="p">,</span>
- <span class="s1">'ave_node_degree'</span><span class="p">,</span>
- <span class="s1">'min_node_degree'</span><span class="p">,</span>
- <span class="s1">'max_node_degree'</span><span class="p">,</span>
- <span class="s1">'ave_fill_factor'</span><span class="p">,</span>
- <span class="s1">'min_fill_factor'</span><span class="p">,</span>
- <span class="s1">'max_fill_factor'</span><span class="p">,</span>
- <span class="s1">'node_label_num'</span><span class="p">,</span>
- <span class="s1">'edge_label_num'</span><span class="p">,</span>
- <span class="s1">'node_attr_dim'</span><span class="p">,</span>
- <span class="s1">'edge_attr_dim'</span><span class="p">,</span>
- <span class="s1">'class_number'</span><span class="p">,</span>
- <span class="p">]</span>
-
- <span class="c1"># dataset size</span>
- <span class="k">if</span> <span class="s1">'dataset_size'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'dataset_size'</span><span class="p">:</span> <span class="n">get_dataset_size</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="c1"># graph node number</span>
- <span class="k">if</span> <span class="nb">any</span><span class="p">(</span><span class="n">i</span> <span class="ow">in</span> <span class="n">attr_names</span>
- <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span> <span class="p">[</span><span class="s1">'ave_node_num'</span><span class="p">,</span> <span class="s1">'min_node_num'</span><span class="p">,</span> <span class="s1">'max_node_num'</span><span class="p">]):</span>
-
- <span class="n">all_node_num</span> <span class="o">=</span> <span class="n">get_all_node_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">if</span> <span class="s1">'ave_node_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'ave_node_num'</span><span class="p">:</span> <span class="n">get_ave_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'min_node_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'min_node_num'</span><span class="p">:</span> <span class="n">get_min_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'max_node_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'max_node_num'</span><span class="p">:</span> <span class="n">get_max_node_num</span><span class="p">(</span><span class="n">all_node_num</span><span class="p">)})</span>
-
- <span class="c1"># graph edge number</span>
- <span class="k">if</span> <span class="nb">any</span><span class="p">(</span><span class="n">i</span> <span class="ow">in</span> <span class="n">attr_names</span> <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span>
- <span class="p">[</span><span class="s1">'ave_edge_num'</span><span class="p">,</span> <span class="s1">'min_edge_num'</span><span class="p">,</span> <span class="s1">'max_edge_num'</span><span class="p">]):</span>
-
- <span class="n">all_edge_num</span> <span class="o">=</span> <span class="n">get_all_edge_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">if</span> <span class="s1">'ave_edge_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'ave_edge_num'</span><span class="p">:</span> <span class="n">get_ave_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'max_edge_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'max_edge_num'</span><span class="p">:</span> <span class="n">get_max_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'min_edge_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
-
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'min_edge_num'</span><span class="p">:</span> <span class="n">get_min_edge_num</span><span class="p">(</span><span class="n">all_edge_num</span><span class="p">)})</span>
-
- <span class="c1"># label number</span>
- <span class="k">if</span> <span class="nb">any</span><span class="p">(</span><span class="n">i</span> <span class="ow">in</span> <span class="n">attr_names</span> <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span> <span class="p">[</span><span class="s1">'node_labeled'</span><span class="p">,</span> <span class="s1">'node_label_num'</span><span class="p">]):</span>
- <span class="n">is_nl</span> <span class="o">=</span> <span class="n">is_node_labeled</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
- <span class="n">node_label_num</span> <span class="o">=</span> <span class="n">get_node_label_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">if</span> <span class="s1">'node_labeled'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="c1"># graphs are considered node unlabeled if all nodes have the same label.</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'node_labeled'</span><span class="p">:</span> <span class="n">is_nl</span> <span class="k">if</span> <span class="n">node_label_num</span> <span class="o">></span> <span class="mi">1</span> <span class="k">else</span> <span class="kc">False</span><span class="p">})</span>
-
- <span class="k">if</span> <span class="s1">'node_label_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'node_label_num'</span><span class="p">:</span> <span class="n">node_label_num</span><span class="p">})</span>
-
- <span class="k">if</span> <span class="nb">any</span><span class="p">(</span><span class="n">i</span> <span class="ow">in</span> <span class="n">attr_names</span> <span class="k">for</span> <span class="n">i</span> <span class="ow">in</span> <span class="p">[</span><span class="s1">'edge_labeled'</span><span class="p">,</span> <span class="s1">'edge_label_num'</span><span class="p">]):</span>
- <span class="n">is_el</span> <span class="o">=</span> <span class="n">is_edge_labeled</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
- <span class="n">edge_label_num</span> <span class="o">=</span> <span class="n">get_edge_label_num</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">if</span> <span class="s1">'edge_labeled'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="c1"># graphs are considered edge unlabeled if all edges have the same label.</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'edge_labeled'</span><span class="p">:</span> <span class="n">is_el</span> <span class="k">if</span> <span class="n">edge_label_num</span> <span class="o">></span> <span class="mi">1</span> <span class="k">else</span> <span class="kc">False</span><span class="p">})</span>
-
- <span class="k">if</span> <span class="s1">'edge_label_num'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'edge_label_num'</span><span class="p">:</span> <span class="n">edge_label_num</span><span class="p">})</span>
-
- <span class="k">if</span> <span class="s1">'is_directed'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'is_directed'</span><span class="p">:</span> <span class="n">is_directed</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'ave_node_degree'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'ave_node_degree'</span><span class="p">:</span> <span class="n">get_ave_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'max_node_degree'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'max_node_degree'</span><span class="p">:</span> <span class="n">get_max_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'min_node_degree'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'min_node_degree'</span><span class="p">:</span> <span class="n">get_min_node_degree</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'ave_fill_factor'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'ave_fill_factor'</span><span class="p">:</span> <span class="n">get_ave_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'max_fill_factor'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'max_fill_factor'</span><span class="p">:</span> <span class="n">get_max_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'min_fill_factor'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'min_fill_factor'</span><span class="p">:</span> <span class="n">get_min_fill_factor</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'substructures'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'substructures'</span><span class="p">:</span> <span class="n">get_substructures</span><span class="p">(</span><span class="n">Gn</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'class_number'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="o">.</span><span class="n">update</span><span class="p">({</span><span class="s1">'class_number'</span><span class="p">:</span> <span class="n">get_class_num</span><span class="p">(</span><span class="n">target</span><span class="p">)})</span>
-
- <span class="k">if</span> <span class="s1">'node_attr_dim'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="p">[</span><span class="s1">'node_attr_dim'</span><span class="p">]</span> <span class="o">=</span> <span class="n">get_node_attr_dim</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="k">if</span> <span class="s1">'edge_attr_dim'</span> <span class="ow">in</span> <span class="n">attr_names</span><span class="p">:</span>
- <span class="n">attrs</span><span class="p">[</span><span class="s1">'edge_attr_dim'</span><span class="p">]</span> <span class="o">=</span> <span class="n">get_edge_attr_dim</span><span class="p">(</span><span class="n">Gn</span><span class="p">)</span>
-
- <span class="kn">from</span> <span class="nn">collections</span> <span class="k">import</span> <span class="n">OrderedDict</span>
- <span class="k">return</span> <span class="n">OrderedDict</span><span class="p">(</span>
- <span class="nb">sorted</span><span class="p">(</span><span class="n">attrs</span><span class="o">.</span><span class="n">items</span><span class="p">(),</span> <span class="n">key</span><span class="o">=</span><span class="k">lambda</span> <span class="n">i</span><span class="p">:</span> <span class="n">attr_names</span><span class="o">.</span><span class="n">index</span><span class="p">(</span><span class="n">i</span><span class="p">[</span><span class="mi">0</span><span class="p">])))</span></div>
- </pre></div>
-
- </div>
-
- </div>
- <footer>
-
-
- <hr/>
-
- <div role="contentinfo">
- <p>
- © Copyright 2020, Linlin Jia
-
- </p>
- </div>
- Built with <a href="http://sphinx-doc.org/">Sphinx</a> using a <a href="https://github.com/rtfd/sphinx_rtd_theme">theme</a> provided by <a href="https://readthedocs.org">Read the Docs</a>.
-
- </footer>
-
- </div>
- </div>
-
- </section>
-
- </div>
-
-
-
- <script type="text/javascript">
- jQuery(function () {
- SphinxRtdTheme.Navigation.enable(true);
- });
- </script>
-
-
-
-
-
-
- </body>
- </html>
|