@@ -12,21 +12,131 @@
"output_type": "stream",
"output_type": "stream",
"text": [
"text": [
"\n",
"\n",
"Acyclic:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 183\n",
"ave_node_num : 8.153005464480874\n",
"min_node_num : 3\n",
"max_node_num : 11\n",
"ave_edge_num : 7.1530054644808745\n",
"min_edge_num : 2\n",
"max_edge_num : 10\n",
"ave_node_degree : 2.80327868852459\n",
"min_node_degree : 2\n",
"max_node_degree : 4\n",
"node_label_num : 3\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 148\n",
"\n",
"\n",
"Alkane:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 150\n",
"ave_node_num : 8.873333333333333\n",
"min_node_num : 1\n",
"max_node_num : 10\n",
"ave_edge_num : 7.873333333333333\n",
"min_edge_num : 0\n",
"max_edge_num : 9\n",
"ave_node_degree : 3.36\n",
"min_node_degree : 0\n",
"max_node_degree : 4\n",
"node_label_num : 2\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 123\n",
"\n",
"\n",
"MAO:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"dataset_size : 68\n",
"ave_node_num : 18.38235294117647\n",
"min_node_num : 11\n",
"max_node_num : 27\n",
"ave_edge_num : 19.63235294117647\n",
"min_edge_num : 12\n",
"max_edge_num : 29\n",
"ave_node_degree : 3.0\n",
"min_node_degree : 3\n",
"max_node_degree : 3\n",
"node_label_num : 3\n",
"edge_label_num : 4\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"PAH:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 94\n",
"ave_node_num : 20.70212765957447\n",
"min_node_num : 10\n",
"max_node_num : 28\n",
"ave_edge_num : 24.425531914893618\n",
"min_edge_num : 11\n",
"max_edge_num : 34\n",
"ave_node_degree : 3.0106382978723403\n",
"min_node_degree : 3\n",
"max_node_degree : 4\n",
"node_label_num : 1\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"MUTAG:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"dataset_size : 188\n",
"ave_node_num : 17.930851063829788\n",
"min_node_num : 10\n",
"max_node_num : 28\n",
"ave_edge_num : 19.79255319148936\n",
"min_edge_num : 10\n",
"max_edge_num : 33\n",
"ave_node_degree : 3.00531914893617\n",
"min_node_degree : 3\n",
"max_node_degree : 4\n",
"node_label_num : 7\n",
"edge_label_num : 11\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"Letter-med:\n",
"Letter-med:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : False\n",
"node_labeled : False\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 2250\n",
"dataset_size : 2250\n",
"ave_graph_size : 4.674666666666667\n",
"min_graph_size : 1\n",
"max_graph_size : 9\n",
"ave_graph_edge_num : 3.2057777777777776\n",
"min_graph_edge_num : 0\n",
"max_graph_edge_num : 7\n",
"ave_graph_degree : 2.012888888888889\n",
"min_graph_degree : 0\n",
"max_graph_degree : 4\n",
"ave_node_num : 4.674666666666667\n",
"min_node_num : 1\n",
"max_node_num : 9\n",
"ave_edge_num : 3.2057777777777776\n",
"min_edge_num : 0\n",
"max_edge_num : 7\n",
"ave_node _degree : 2.012888888888889\n",
"min_node _degree : 0\n",
"max_node _degree : 4\n",
"node_label_num : 0\n",
"node_label_num : 0\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 2\n",
"node_attr_dim : 2\n",
@@ -34,21 +144,43 @@
"class_number : 15\n",
"class_number : 15\n",
"\n",
"\n",
"\n",
"\n",
"ENZYMES:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 600\n",
"ave_node_num : 32.63333333333333\n",
"min_node_num : 2\n",
"max_node_num : 126\n",
"ave_edge_num : 62.13666666666666\n",
"min_edge_num : 1\n",
"max_edge_num : 149\n",
"ave_node_degree : 6.086666666666667\n",
"min_node_degree : 1\n",
"max_node_degree : 9\n",
"node_label_num : 3\n",
"edge_label_num : 0\n",
"node_attr_dim : 18\n",
"edge_attr_dim : 0\n",
"class_number : 6\n",
"\n",
"\n",
"Mutagenicity:\n",
"Mutagenicity:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 4337\n",
"dataset_size : 4337\n",
"ave_graph_size : 30.317731150564907\n",
"min_graph_size : 4\n",
"max_graph_size : 417\n",
"ave_graph_edge_num : 30.76942587041734\n",
"min_graph_edge_num : 3\n",
"max_graph_edge_num : 112\n",
"ave_graph_degree : 3.75651371916071\n",
"min_graph_degree : 3\n",
"max_graph_degree : 4\n",
"ave_node_num : 30.317731150564907\n",
"min_node_num : 4\n",
"max_node_num : 417\n",
"ave_edge_num : 30.76942587041734\n",
"min_edge_num : 3\n",
"max_edge_num : 112\n",
"ave_node _degree : 3.75651371916071\n",
"min_node _degree : 3\n",
"max_node _degree : 4\n",
"node_label_num : 14\n",
"node_label_num : 14\n",
"edge_label_num : 3\n",
"edge_label_num : 3\n",
"node_attr_dim : 0\n",
"node_attr_dim : 0\n",
@@ -56,21 +188,43 @@
"class_number : 2\n",
"class_number : 2\n",
"\n",
"\n",
"\n",
"\n",
"D&D:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 1178\n",
"ave_node_num : 284.3166383701188\n",
"min_node_num : 30\n",
"max_node_num : 5748\n",
"ave_edge_num : 715.6587436332767\n",
"min_edge_num : 63\n",
"max_edge_num : 14267\n",
"ave_node_degree : 9.509337860780985\n",
"min_node_degree : 6\n",
"max_node_degree : 19\n",
"node_label_num : 82\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"AIDS:\n",
"AIDS:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 2000\n",
"dataset_size : 2000\n",
"ave_graph_size : 15.6925\n",
"min_graph_size : 2\n",
"max_graph_size : 95\n",
"ave_graph_edge_num : 16.195\n",
"min_graph_edge_num : 1\n",
"max_graph_edge_num : 103\n",
"ave_graph_degree : 3.322\n",
"min_graph_degree : 1\n",
"max_graph_degree : 6\n",
"ave_node_num : 15.6925\n",
"min_node_num : 2\n",
"max_node_num : 95\n",
"ave_edge_num : 16.195\n",
"min_edge_num : 1\n",
"max_edge_num : 103\n",
"ave_node _degree : 3.322\n",
"min_node _degree : 1\n",
"max_node _degree : 6\n",
"node_label_num : 38\n",
"node_label_num : 38\n",
"edge_label_num : 3\n",
"edge_label_num : 3\n",
"node_attr_dim : 4\n",
"node_attr_dim : 4\n",
@@ -84,15 +238,15 @@
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 41\n",
"dataset_size : 41\n",
"ave_graph_size : 1377.2682926829268\n",
"min_graph_size : 134\n",
"max_graph_size : 5037\n",
"ave_graph_ edge_num : 3074.0975609756097\n",
"min_graph_ edge_num : 320\n",
"max_graph_ edge_num : 10888\n",
"ave_graph _degree : 7.853658536585366\n",
"min_graph _degree : 6\n",
"max_graph _degree : 10\n",
"ave_node_num : 1377.2682926829268\n",
"min_node_num : 134\n",
"max_node_num : 5037\n",
"ave_edge_num : 3074.0975609756097\n",
"min_edge_num : 320\n",
"max_edge_num : 10888\n",
"ave_node _degree : 7.853658536585366\n",
"min_node _degree : 6\n",
"max_node _degree : 10\n",
"node_label_num : 5\n",
"node_label_num : 5\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 1\n",
"node_attr_dim : 1\n",
@@ -101,20 +255,20 @@
"\n",
"\n",
"\n",
"\n",
"MSRC9:\n",
"MSRC9:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 221\n",
"dataset_size : 221\n",
"ave_graph_size : 40.57918552036199\n",
"min_graph_size : 25\n",
"max_graph_size : 55\n",
"ave_graph_ edge_num : 97.9366515837104\n",
"min_graph_ edge_num : 53\n",
"max_graph_ edge_num : 145\n",
"ave_graph _degree : 10.158371040723981\n",
"min_graph _degree : 8\n",
"max_graph _degree : 16\n",
"ave_node_num : 40.57918552036199\n",
"min_node_num : 25\n",
"max_node_num : 55\n",
"ave_edge_num : 97.9366515837104\n",
"min_edge_num : 53\n",
"max_edge_num : 145\n",
"ave_node _degree : 10.158371040723981\n",
"min_node _degree : 8\n",
"max_node _degree : 16\n",
"node_label_num : 10\n",
"node_label_num : 10\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"node_attr_dim : 0\n",
@@ -123,20 +277,20 @@
"\n",
"\n",
"\n",
"\n",
"MSRC21:\n",
"MSRC21:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 563\n",
"dataset_size : 563\n",
"ave_graph_size : 77.52042628774423\n",
"min_graph_size : 51\n",
"max_graph_size : 141\n",
"ave_graph_ edge_num : 198.32326820603907\n",
"min_graph_ edge_num : 121\n",
"max_graph_ edge_num : 405\n",
"ave_graph _degree : 11.41563055062167\n",
"min_graph _degree : 8\n",
"max_graph _degree : 23\n",
"ave_node_num : 77.52042628774423\n",
"min_node_num : 51\n",
"max_node_num : 141\n",
"ave_edge_num : 198.32326820603907\n",
"min_edge_num : 121\n",
"max_edge_num : 405\n",
"ave_node _degree : 11.41563055062167\n",
"min_node _degree : 8\n",
"max_node _degree : 23\n",
"node_label_num : 22\n",
"node_label_num : 22\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"node_attr_dim : 0\n",
@@ -145,20 +299,20 @@
"\n",
"\n",
"\n",
"\n",
"SYNTHETIC:\n",
"SYNTHETIC:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 300\n",
"dataset_size : 300\n",
"ave_graph_size : 100.0\n",
"min_graph_size : 100\n",
"max_graph_size : 100\n",
"ave_graph_ edge_num : 196.0\n",
"min_graph_ edge_num : 196\n",
"max_graph_ edge_num : 196\n",
"ave_graph _degree : 8.0\n",
"min_graph _degree : 8\n",
"max_graph _degree : 8\n",
"ave_node_num : 100.0\n",
"min_node_num : 100\n",
"max_node_num : 100\n",
"ave_edge_num : 196.0\n",
"min_edge_num : 196\n",
"max_edge_num : 196\n",
"ave_node _degree : 8.0\n",
"min_node _degree : 8\n",
"max_node _degree : 8\n",
"node_label_num : 8\n",
"node_label_num : 8\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 1\n",
"node_attr_dim : 1\n",
@@ -167,20 +321,20 @@
"\n",
"\n",
"\n",
"\n",
"BZR:\n",
"BZR:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 405\n",
"dataset_size : 405\n",
"ave_graph_size : 35.75061728395062\n",
"min_graph_size : 13\n",
"max_graph_size : 57\n",
"ave_graph_ edge_num : 38.358024691358025\n",
"min_graph_ edge_num : 13\n",
"max_graph_ edge_num : 60\n",
"ave_graph _degree : 3.8641975308641974\n",
"min_graph _degree : 3\n",
"max_graph _degree : 4\n",
"ave_node_num : 35.75061728395062\n",
"min_node_num : 13\n",
"max_node_num : 57\n",
"ave_edge_num : 38.358024691358025\n",
"min_edge_num : 13\n",
"max_edge_num : 60\n",
"ave_node _degree : 3.8641975308641974\n",
"min_node _degree : 3\n",
"max_node _degree : 4\n",
"node_label_num : 10\n",
"node_label_num : 10\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 3\n",
"node_attr_dim : 3\n",
@@ -189,20 +343,20 @@
"\n",
"\n",
"\n",
"\n",
"COX2:\n",
"COX2:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 467\n",
"dataset_size : 467\n",
"ave_graph_size : 41.224839400428266\n",
"min_graph_size : 32\n",
"max_graph_size : 56\n",
"ave_graph_ edge_num : 43.44539614561028\n",
"min_graph_ edge_num : 34\n",
"max_graph_ edge_num : 59\n",
"ave_graph _degree : 4.0\n",
"min_graph _degree : 4\n",
"max_graph _degree : 4\n",
"ave_node_num : 41.224839400428266\n",
"min_node_num : 32\n",
"max_node_num : 56\n",
"ave_edge_num : 43.44539614561028\n",
"min_edge_num : 34\n",
"max_edge_num : 59\n",
"ave_node _degree : 4.0\n",
"min_node _degree : 4\n",
"max_node _degree : 4\n",
"node_label_num : 8\n",
"node_label_num : 8\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 3\n",
"node_attr_dim : 3\n",
@@ -211,20 +365,20 @@
"\n",
"\n",
"\n",
"\n",
"DHFR:\n",
"DHFR:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 756\n",
"dataset_size : 756\n",
"ave_graph_size : 42.42724867724868\n",
"min_graph_size : 20\n",
"max_graph_size : 71\n",
"ave_graph_ edge_num : 44.544973544973544\n",
"min_graph_ edge_num : 21\n",
"max_graph_ edge_num : 73\n",
"ave_graph _degree : 3.955026455026455\n",
"min_graph _degree : 3\n",
"max_graph _degree : 4\n",
"ave_node_num : 42.42724867724868\n",
"min_node_num : 20\n",
"max_node_num : 71\n",
"ave_edge_num : 44.544973544973544\n",
"min_edge_num : 21\n",
"max_edge_num : 73\n",
"ave_node _degree : 3.955026455026455\n",
"min_node _degree : 3\n",
"max_node _degree : 4\n",
"node_label_num : 9\n",
"node_label_num : 9\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 3\n",
"node_attr_dim : 3\n",
@@ -232,43 +386,21 @@
"class_number : 2\n",
"class_number : 2\n",
"\n",
"\n",
"\n",
"\n",
"ENZYMES:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 600\n",
"ave_graph_size : 32.63333333333333\n",
"min_graph_size : 2\n",
"max_graph_size : 126\n",
"ave_graph_edge_num : 62.13666666666666\n",
"min_graph_edge_num : 1\n",
"max_graph_edge_num : 149\n",
"ave_graph_degree : 6.086666666666667\n",
"min_graph_degree : 1\n",
"max_graph_degree : 9\n",
"node_label_num : 3\n",
"edge_label_num : 0\n",
"node_attr_dim : 18\n",
"edge_attr_dim : 0\n",
"class_number : 6\n",
"\n",
"\n",
"PROTEINS:\n",
"PROTEINS:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 1113\n",
"dataset_size : 1113\n",
"ave_graph_size : 39.05750224618149\n",
"min_graph_size : 4\n",
"max_graph_size : 620\n",
"ave_graph_ edge_num : 72.8158131176999\n",
"min_graph_ edge_num : 5\n",
"max_graph_ edge_num : 1049\n",
"ave_graph _degree : 5.794249775381851\n",
"min_graph _degree : 3\n",
"max_graph _degree : 25\n",
"ave_node_num : 39.05750224618149\n",
"min_node_num : 4\n",
"max_node_num : 620\n",
"ave_edge_num : 72.8158131176999\n",
"min_edge_num : 5\n",
"max_edge_num : 1049\n",
"ave_node_degree : 5.794249775381851\n",
"min_node_degree : 3\n",
"max_node_degree : 25\n",
"node_label_num : 3\n",
"node_label_num : 3\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 1\n",
"node_attr_dim : 1\n",
@@ -277,135 +409,25 @@
"\n",
"\n",
"\n",
"\n",
"PROTEINS_full:\n",
"PROTEINS_full:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 1113\n",
"dataset_size : 1113\n",
"ave_graph_size : 39.05750224618149\n",
"min_graph_size : 4\n",
"max_graph_size : 620\n",
"ave_graph_ edge_num : 72.8158131176999\n",
"min_graph_ edge_num : 5\n",
"max_graph_ edge_num : 1049\n",
"ave_graph _degree : 5.794249775381851\n",
"min_graph _degree : 3\n",
"max_graph _degree : 25\n",
"ave_node_num : 39.05750224618149\n",
"min_node_num : 4\n",
"max_node_num : 620\n",
"ave_edge_num : 72.8158131176999\n",
"min_edge_num : 5\n",
"max_edge_num : 1049\n",
"ave_node _degree : 5.794249775381851\n",
"min_node _degree : 3\n",
"max_node _degree : 25\n",
"node_label_num : 3\n",
"node_label_num : 3\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 29\n",
"node_attr_dim : 29\n",
"edge_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"class_number : 2\n",
"\n",
"\n",
"D&D:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 1178\n",
"ave_graph_size : 284.3166383701188\n",
"min_graph_size : 30\n",
"max_graph_size : 5748\n",
"ave_graph_edge_num : 715.6587436332767\n",
"min_graph_edge_num : 63\n",
"max_graph_edge_num : 14267\n",
"ave_graph_degree : 9.509337860780985\n",
"min_graph_degree : 6\n",
"max_graph_degree : 19\n",
"node_label_num : 82\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"MUTAG:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"dataset_size : 188\n",
"ave_graph_size : 17.930851063829788\n",
"min_graph_size : 10\n",
"max_graph_size : 28\n",
"ave_graph_edge_num : 19.79255319148936\n",
"min_graph_edge_num : 10\n",
"max_graph_edge_num : 33\n",
"ave_graph_degree : 3.00531914893617\n",
"min_graph_degree : 3\n",
"max_graph_degree : 4\n",
"node_label_num : 7\n",
"edge_label_num : 11\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"Alkane:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 150\n",
"ave_graph_size : 8.873333333333333\n",
"min_graph_size : 1\n",
"max_graph_size : 10\n",
"ave_graph_edge_num : 7.873333333333333\n",
"min_graph_edge_num : 0\n",
"max_graph_edge_num : 9\n",
"ave_graph_degree : 3.36\n",
"min_graph_degree : 0\n",
"max_graph_degree : 4\n",
"node_label_num : 2\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 123\n",
"\n",
"\n",
"Acyclic:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 183\n",
"ave_graph_size : 8.153005464480874\n",
"min_graph_size : 3\n",
"max_graph_size : 11\n",
"ave_graph_edge_num : 7.1530054644808745\n",
"min_graph_edge_num : 2\n",
"max_graph_edge_num : 10\n",
"ave_graph_degree : 2.80327868852459\n",
"min_graph_degree : 2\n",
"max_graph_degree : 4\n",
"node_label_num : 3\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 148\n",
"\n",
"\n",
"MAO:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"dataset_size : 68\n",
"ave_graph_size : 18.38235294117647\n",
"min_graph_size : 11\n",
"max_graph_size : 27\n",
"ave_graph_edge_num : 19.63235294117647\n",
"min_graph_edge_num : 12\n",
"max_graph_edge_num : 29\n",
"ave_graph_degree : 3.0\n",
"min_graph_degree : 3\n",
"max_graph_degree : 3\n",
"node_label_num : 3\n",
"edge_label_num : 4\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n"
"\n"
]
]
},
},
@@ -414,43 +436,21 @@
"output_type": "stream",
"output_type": "stream",
"text": [
"text": [
"\n",
"\n",
"PAH:\n",
"substructures : {'linear', 'non linear'}\n",
"node_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"dataset_size : 94\n",
"ave_graph_size : 20.70212765957447\n",
"min_graph_size : 10\n",
"max_graph_size : 28\n",
"ave_graph_edge_num : 24.425531914893618\n",
"min_graph_edge_num : 11\n",
"max_graph_edge_num : 34\n",
"ave_graph_degree : 3.0106382978723403\n",
"min_graph_degree : 3\n",
"max_graph_degree : 4\n",
"node_label_num : 1\n",
"edge_label_num : 1\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"\n",
"\n",
"NCI1:\n",
"NCI1:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 4110\n",
"dataset_size : 4110\n",
"ave_graph_size : 29.8654501216545\n",
"min_graph_size : 3\n",
"max_graph_size : 111\n",
"ave_graph_ edge_num : 32.3\n",
"min_graph_ edge_num : 2\n",
"max_graph_ edge_num : 119\n",
"ave_graph _degree : 3.3360097323600972\n",
"min_graph _degree : 2\n",
"max_graph _degree : 4\n",
"ave_node_num : 29.8654501216545\n",
"min_node_num : 3\n",
"max_node_num : 111\n",
"ave_edge_num : 32.3\n",
"min_edge_num : 2\n",
"max_edge_num : 119\n",
"ave_node_degree : 3.3360097323600972\n",
"min_node_degree : 2\n",
"max_node_degree : 4\n",
"node_label_num : 37\n",
"node_label_num : 37\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"node_attr_dim : 0\n",
@@ -459,39 +459,51 @@
"\n",
"\n",
"\n",
"\n",
"NCI109:\n",
"NCI109:\n",
"substructures : {'linear', 'non linear'}\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"node_labeled : True\n",
"edge_labeled : False\n",
"edge_labeled : False\n",
"is_directed : False\n",
"is_directed : False\n",
"dataset_size : 4127\n",
"dataset_size : 4127\n",
"ave_graph_size : 29.681124303368065\n",
"min_graph_size : 4\n",
"max_graph_size : 111\n",
"ave_graph_ edge_num : 32.13084565059365\n",
"min_graph_ edge_num : 3\n",
"max_graph_ edge_num : 119\n",
"ave_graph _degree : 3.343833292948873\n",
"min_graph _degree : 2\n",
"max_graph _degree : 5\n",
"ave_node_num : 29.681124303368065\n",
"min_node_num : 4\n",
"max_node_num : 111\n",
"ave_edge_num : 32.13084565059365\n",
"min_edge_num : 3\n",
"max_edge_num : 119\n",
"ave_node _degree : 3.343833292948873\n",
"min_node _degree : 2\n",
"max_node _degree : 5\n",
"node_label_num : 38\n",
"node_label_num : 38\n",
"edge_label_num : 0\n",
"edge_label_num : 0\n",
"node_attr_dim : 0\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 2\n",
"class_number : 2\n",
"\n",
"load SDF: 100%|██████████| 4457424/4457424 [00:10<00:00, 430440.94it/s]\n",
"ajust data: 100%|██████████| 42687/42687 [00:09<00:00, 4352.25it/s] \n",
"\n",
"NCI-HIV:\n",
"substructures : {'non linear', 'linear'}\n",
"node_labeled : True\n",
"edge_labeled : True\n",
"is_directed : False\n",
"dataset_size : 42682\n",
"ave_node_num : 45.70945597675835\n",
"min_node_num : 2\n",
"max_node_num : 438\n",
"ave_edge_num : 47.7137903565906\n",
"min_edge_num : 1\n",
"max_edge_num : 441\n",
"ave_node_degree : 3.9760554800618526\n",
"min_node_degree : 1\n",
"max_node_degree : 12\n",
"node_label_num : 63\n",
"edge_label_num : 3\n",
"node_attr_dim : 0\n",
"edge_attr_dim : 0\n",
"class_number : 3\n",
"\n"
"\n"
]
]
},
{
"ename": "ModuleNotFoundError",
"evalue": "No module named 'tqdm'",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)",
"\u001b[0;32m<ipython-input-1-1e4da065c026>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[1;32m 45\u001b[0m \u001b[0mds\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'dataset'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 46\u001b[0m \u001b[0mfilename_y\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mds\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'dataset_y'\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;34m'dataset_y'\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mds\u001b[0m \u001b[0;32melse\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 47\u001b[0;31m extra_params=(ds['extra_params'] if 'extra_params' in ds else None))\n\u001b[0m\u001b[1;32m 48\u001b[0m attrs = get_dataset_attributes(\n\u001b[1;32m 49\u001b[0m dataset, target=y, node_label='atom', edge_label='bond_type')\n",
"\u001b[0;32m/media/ljia/DATA/research-repo/codes/Linlin/py-graph/pygraph/utils/graphfiles.py\u001b[0m in \u001b[0;36mloadDataset\u001b[0;34m(filename, filename_y, extra_params)\u001b[0m\n\u001b[1;32m 377\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0mextension\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0;34m\"sdf\"\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 378\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mnumpy\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0mnp\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 379\u001b[0;31m \u001b[0;32mfrom\u001b[0m \u001b[0mtqdm\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mtqdm\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 380\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0msys\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 381\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
"\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'tqdm'"
]
}
}
],
],
"source": [
"source": [
@@ -501,8 +513,18 @@
"from pygraph.utils.graphdataset import get_dataset_attributes\n",
"from pygraph.utils.graphdataset import get_dataset_attributes\n",
"\n",
"\n",
"dslist = [\n",
"dslist = [\n",
" {'name': 'Acyclic', 'dataset': '../datasets/acyclic/dataset_bps.ds',},\n",
" {'name': 'Alkane', 'dataset': '../datasets/Alkane/dataset.ds',\n",
" 'dataset_y': '../datasets/Alkane/dataset_boiling_point_names.txt',},\n",
" {'name': 'MAO', 'dataset': '../datasets/MAO/dataset.ds',},\n",
" {'name': 'PAH', 'dataset': '../datasets/PAH/dataset.ds',},\n",
" {'name': 'MUTAG', 'dataset': '../datasets/MUTAG/MUTAG.mat',\n",
" 'extra_params': {'am_sp_al_nl_el': [0, 0, 3, 1, 2]}},\n",
" {'name': 'Letter-med', 'dataset': '../datasets/Letter-med/Letter-med_A.txt'},\n",
" {'name': 'Letter-med', 'dataset': '../datasets/Letter-med/Letter-med_A.txt'},\n",
" {'name': 'ENZYMES', 'dataset': '../datasets/ENZYMES_txt/ENZYMES_A_sparse.txt'},\n",
" {'name': 'Mutagenicity', 'dataset': '../datasets/Mutagenicity/Mutagenicity_A.txt'},\n",
" {'name': 'Mutagenicity', 'dataset': '../datasets/Mutagenicity/Mutagenicity_A.txt'},\n",
" {'name': 'D&D', 'dataset': '../datasets/D&D/DD.mat',\n",
" 'extra_params': {'am_sp_al_nl_el': [0, 1, 2, 1, -1]}},\n",
" {'name': 'AIDS', 'dataset': '../datasets/AIDS/AIDS_A.txt'},\n",
" {'name': 'AIDS', 'dataset': '../datasets/AIDS/AIDS_A.txt'},\n",
" {'name': 'FIRSTMM_DB', 'dataset': '../datasets/FIRSTMM_DB/FIRSTMM_DB_A.txt'},\n",
" {'name': 'FIRSTMM_DB', 'dataset': '../datasets/FIRSTMM_DB/FIRSTMM_DB_A.txt'},\n",
" {'name': 'MSRC9', 'dataset': '../datasets/MSRC_9_txt/MSRC_9_A.txt'},\n",
" {'name': 'MSRC9', 'dataset': '../datasets/MSRC_9_txt/MSRC_9_A.txt'},\n",
@@ -510,19 +532,9 @@
" {'name': 'SYNTHETIC', 'dataset': '../datasets/SYNTHETIC_txt/SYNTHETIC_A_sparse.txt'},\n",
" {'name': 'SYNTHETIC', 'dataset': '../datasets/SYNTHETIC_txt/SYNTHETIC_A_sparse.txt'},\n",
" {'name': 'BZR', 'dataset': '../datasets/BZR_txt/BZR_A_sparse.txt'},\n",
" {'name': 'BZR', 'dataset': '../datasets/BZR_txt/BZR_A_sparse.txt'},\n",
" {'name': 'COX2', 'dataset': '../datasets/COX2_txt/COX2_A_sparse.txt'},\n",
" {'name': 'COX2', 'dataset': '../datasets/COX2_txt/COX2_A_sparse.txt'},\n",
" {'name': 'DHFR', 'dataset': '../datasets/DHFR_txt/DHFR_A_sparse.txt'},\n",
" {'name': 'ENZYMES', 'dataset': '../datasets/ENZYMES_txt/ENZYMES_A_sparse.txt'},\n",
" {'name': 'DHFR', 'dataset': '../datasets/DHFR_txt/DHFR_A_sparse.txt'}, \n",
" {'name': 'PROTEINS', 'dataset': '../datasets/PROTEINS_txt/PROTEINS_A_sparse.txt'},\n",
" {'name': 'PROTEINS', 'dataset': '../datasets/PROTEINS_txt/PROTEINS_A_sparse.txt'},\n",
" {'name': 'PROTEINS_full', 'dataset': '../datasets/PROTEINS_full_txt/PROTEINS_full_A_sparse.txt'},\n",
" {'name': 'D&D', 'dataset': '../datasets/D&D/DD.mat',\n",
" 'extra_params': {'am_sp_al_nl_el': [0, 1, 2, 1, -1]}},\n",
" {'name': 'MUTAG', 'dataset': '../datasets/MUTAG/MUTAG.mat',\n",
" 'extra_params': {'am_sp_al_nl_el': [0, 0, 3, 1, 2]}},\n",
" {'name': 'Alkane', 'dataset': '../datasets/Alkane/dataset.ds',\n",
" 'dataset_y': '../datasets/Alkane/dataset_boiling_point_names.txt',},\n",
" {'name': 'Acyclic', 'dataset': '../datasets/acyclic/dataset_bps.ds',},\n",
" {'name': 'MAO', 'dataset': '../datasets/MAO/dataset.ds',},\n",
" {'name': 'PAH', 'dataset': '../datasets/PAH/dataset.ds',},\n",
" {'name': 'PROTEINS_full', 'dataset': '../datasets/PROTEINS_full_txt/PROTEINS_full_A_sparse.txt'}, \n",
" {'name': 'NCI1', 'dataset': '../datasets/NCI1/NCI1.mat',\n",
" {'name': 'NCI1', 'dataset': '../datasets/NCI1/NCI1.mat',\n",
" 'extra_params': {'am_sp_al_nl_el': [1, 1, 2, 0, -1]}},\n",
" 'extra_params': {'am_sp_al_nl_el': [1, 1, 2, 0, -1]}},\n",
" {'name': 'NCI109', 'dataset': '../datasets/NCI109/NCI109.mat',\n",
" {'name': 'NCI109', 'dataset': '../datasets/NCI109/NCI109.mat',\n",