You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

metadata.py 65 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. Created on Tue Oct 20 14:25:49 2020
  5. @author: ljia
  6. """
  7. DATABASES = {
  8. 'greyc': 'https://brunl01.users.greyc.fr/CHEMISTRY/',
  9. 'iam': 'https://iapr-tc15.greyc.fr/IAM/',
  10. 'tudataset': 'http://graphlearning.io/docs/datasets/',
  11. }
  12. ### -------- database greyc -------- ###
  13. GREYC_META = {
  14. 'ACE': {
  15. 'database': 'greyc',
  16. 'reference': None,
  17. 'dataset_size': 32,
  18. 'class_number': 2,
  19. 'task_type': 'classification',
  20. 'ave_node_num': 52,
  21. 'ave_edge_num': None,
  22. 'node_labeled': None,
  23. 'edge_labeled': None,
  24. 'node_attr_dim': None,
  25. 'geometry': None,
  26. 'edge_attr_dim': None,
  27. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ACEDataset.tar',
  28. 'domain': 'small molecules',
  29. 'train_valid_test': [],
  30. 'stereoisomerism': True,
  31. 'load_files': ['data.ds'],
  32. 'extra_params': {'gformat': 'cml'}
  33. },
  34. 'Acyclic': {
  35. 'database': 'greyc',
  36. 'reference': None,
  37. 'dataset_size': 183,
  38. 'class_number': None,
  39. 'task_type': 'regression',
  40. 'ave_node_num': 8.15,
  41. 'ave_edge_num': 7.15,
  42. 'node_labeled': True,
  43. 'edge_labeled': False,
  44. 'node_attr_dim': 0,
  45. 'geometry': None,
  46. 'edge_attr_dim': 0,
  47. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/Acyclic.tar.gz',
  48. 'domain': 'small molecules',
  49. 'train_valid_test': None,
  50. 'stereoisomerism': False,
  51. 'load_files': ['dataset_bps.ds'],
  52. },
  53. 'AIDS_greyc': {
  54. 'database': 'greyc',
  55. 'reference': None,
  56. 'dataset_size': 2000,
  57. 'class_number': 2,
  58. 'task_type': 'classification',
  59. 'ave_node_num': 15.69,
  60. 'ave_edge_num': 16.20,
  61. 'node_labeled': True,
  62. 'edge_labeled': True,
  63. 'node_attr_dim': None,
  64. 'geometry': None,
  65. 'edge_attr_dim': None,
  66. 'url': 'https://iapr-tc15.greyc.fr/IAM/AIDS.zip',
  67. 'domain': 'small molecules',
  68. 'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl',],
  69. 'stereoisomerism': False,
  70. 'load_files': ['data/'],
  71. },
  72. 'Alkane': {
  73. 'database': 'greyc',
  74. 'reference': None,
  75. 'dataset_size': 150,
  76. 'class_number': None,
  77. 'task_type': 'regression',
  78. 'ave_node_num': 8.87,
  79. 'ave_edge_num': 7.87,
  80. 'node_labeled': False,
  81. 'edge_labeled': False,
  82. 'node_attr_dim': 0,
  83. 'geometry': None,
  84. 'edge_attr_dim': 0,
  85. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/alkane_dataset.tar.gz',
  86. 'domain': 'small molecules',
  87. 'train_valid_test': None,
  88. 'stereoisomerism': False,
  89. 'load_files': ['dataset.ds', 'dataset_boiling_point_names.txt'],
  90. },
  91. 'Chiral': {
  92. 'database': 'greyc',
  93. 'reference': None,
  94. 'dataset_size': 35,
  95. 'class_number': None,
  96. 'task_type': 'regression',
  97. 'ave_node_num': 21.29,
  98. 'ave_edge_num': None,
  99. 'node_labeled': None,
  100. 'edge_labeled': None,
  101. 'node_attr_dim': None,
  102. 'geometry': None,
  103. 'edge_attr_dim': None,
  104. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetAcyclicChiral.tar',
  105. 'domain': 'small molecules',
  106. 'train_valid_test': [],
  107. 'stereoisomerism': True,
  108. 'load_files': ['data.txt'],
  109. 'extra_params': {'gformat': 'cml'}
  110. },
  111. 'MAO': {
  112. 'database': 'greyc',
  113. 'reference': None,
  114. 'dataset_size': 68,
  115. 'class_number': 2,
  116. 'task_type': 'classification',
  117. 'ave_node_num': 18.38,
  118. 'ave_edge_num': 19.63,
  119. 'node_labeled': True,
  120. 'edge_labeled': True,
  121. 'node_attr_dim': 0,
  122. 'geometry': None,
  123. 'edge_attr_dim': 0,
  124. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/mao.tgz',
  125. 'domain': 'small molecules',
  126. 'train_valid_test': None,
  127. 'stereoisomerism': False,
  128. 'load_files': ['dataset.ds'],
  129. },
  130. 'Monoterpenoides': {
  131. 'database': 'greyc',
  132. 'reference': None,
  133. 'dataset_size': 382,
  134. 'class_number': 10,
  135. 'task_type': 'classification',
  136. 'ave_node_num': 10,
  137. 'ave_edge_num': None,
  138. 'node_labeled': None,
  139. 'edge_labeled': None,
  140. 'node_attr_dim': None,
  141. 'geometry': None,
  142. 'edge_attr_dim': None,
  143. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/monoterpenoides.tar.gz',
  144. 'domain': 'small molecules',
  145. 'train_valid_test': None,
  146. 'stereoisomerism': False,
  147. 'load_files': ['dataset_10+.ds'],
  148. },
  149. 'PAH': {
  150. 'database': 'greyc',
  151. 'reference': None,
  152. 'dataset_size': 94,
  153. 'class_number': 2,
  154. 'task_type': 'classification',
  155. 'ave_node_num': 20.7,
  156. 'ave_edge_num': 24.43,
  157. 'node_labeled': False,
  158. 'edge_labeled': False,
  159. 'node_attr_dim': 0,
  160. 'geometry': None,
  161. 'edge_attr_dim': 0,
  162. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/PAH.tar.gz',
  163. 'domain': 'small molecules',
  164. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  165. 'stereoisomerism': False,
  166. 'load_files': [['trainset_0.ds', 'testset_0.ds']],
  167. },
  168. 'PTC': {
  169. 'database': 'greyc',
  170. 'reference': None,
  171. 'dataset_size': 416,
  172. 'class_number': None,
  173. 'task_type': 'classification',
  174. 'ave_node_num': 14.4,
  175. 'ave_edge_num': None,
  176. 'node_labeled': None,
  177. 'edge_labeled': None,
  178. 'node_attr_dim': None,
  179. 'geometry': None,
  180. 'edge_attr_dim': None,
  181. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ptc.tgz',
  182. 'domain': 'small molecules',
  183. 'train_valid_test': None,
  184. 'stereoisomerism': False,
  185. 'load_files': [],
  186. 'extra_info': 'This dataset has test and train datasets. Select gender between mm, fm, mr, fr. \ndataloader = DataLoader(\'Ptc\',root = ..., option = \'mm\') \ntest,train = dataloader.dataset \nGs_test, y_test = test \nGs_train_, y_train = train',
  187. },
  188. 'Steroid': {
  189. 'database': 'greyc',
  190. 'reference': None,
  191. 'dataset_size': 64,
  192. 'class_number': None,
  193. 'task_type': 'regression',
  194. 'ave_node_num': 75.11,
  195. 'ave_edge_num': None,
  196. 'node_labeled': None,
  197. 'edge_labeled': None,
  198. 'node_attr_dim': None,
  199. 'geometry': None,
  200. 'edge_attr_dim': None,
  201. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/SteroidDataset.tar',
  202. 'domain': 'small molecules',
  203. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  204. 'stereoisomerism': False,
  205. 'load_files': [],
  206. },
  207. 'Vitamin_D': {
  208. 'database': 'greyc',
  209. 'reference': None,
  210. 'dataset_size': 69,
  211. 'class_number': None,
  212. 'task_type': 'regression',
  213. 'ave_node_num': 76.91,
  214. 'ave_edge_num': None,
  215. 'node_labeled': None,
  216. 'edge_labeled': None,
  217. 'node_attr_dim': None,
  218. 'geometry': None,
  219. 'edge_attr_dim': None,
  220. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetVitamin.tar',
  221. 'domain': 'small molecules',
  222. 'train_valid_test': [],
  223. 'stereoisomerism': True,
  224. 'load_files': ['data.txt'],
  225. 'extra_params': {'gformat': 'cml'}
  226. },
  227. }
  228. ### -------- database iam -------- ###
  229. # @todo: several datasets in this database are included in TUDataset. However they do not include train/valid/test sets.
  230. IAM_META = {
  231. 'GREC': {
  232. 'database': 'iam',
  233. 'reference': None,
  234. 'dataset_size': None,
  235. 'class_number': None,
  236. 'task_type': None,
  237. 'ave_node_num': None,
  238. 'ave_edge_num': None,
  239. 'node_labeled': None,
  240. 'edge_labeled': None,
  241. 'node_attr_dim': None,
  242. 'geometry': None,
  243. 'edge_attr_dim': None,
  244. 'url': 'https://iapr-tc15.greyc.fr/IAM/GREC.zip',
  245. 'domain': None,
  246. 'train_valid_test': ['data/test.cxl','data/train.cxl', 'data/valid.cxl'],
  247. 'load_files': [],
  248. },
  249. 'Web': {
  250. 'database': 'iam',
  251. 'reference': None,
  252. 'dataset_size': None,
  253. 'class_number': None,
  254. 'task_type': None,
  255. 'ave_node_num': None,
  256. 'ave_edge_num': None,
  257. 'node_labeled': None,
  258. 'edge_labeled': None,
  259. 'node_attr_dim': None,
  260. 'geometry': None,
  261. 'edge_attr_dim': None,
  262. 'url': 'https://iapr-tc15.greyc.fr/IAM/Web.zip',
  263. 'domain': None,
  264. 'train_valid_test': ['data/test.cxl', 'data/train.cxl', 'data/valid.cxl'],
  265. 'load_files': [],
  266. },
  267. }
  268. ### -------- database tudataset -------- ###
  269. TUDataset_META = {
  270. ### small molecules
  271. 'AIDS': {
  272. 'database': 'tudataset',
  273. 'reference': '[16,17]',
  274. 'dataset_size': 2000,
  275. 'class_number': 2,
  276. 'task_type': 'classification',
  277. 'ave_node_num': 15.69,
  278. 'ave_edge_num': 16.2,
  279. 'node_labeled': True,
  280. 'edge_labeled': True,
  281. 'node_attr_dim': 4,
  282. 'geometry': None,
  283. 'edge_attr_dim': 0,
  284. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/AIDS.zip',
  285. 'domain': 'small molecules',
  286. },
  287. 'alchemy_full': {
  288. 'database': 'tudataset',
  289. 'reference': '[29]',
  290. 'dataset_size': 202579,
  291. 'class_number': None,
  292. 'task_type': 'regression',
  293. 'ave_node_num': 10.1,
  294. 'ave_edge_num': 10.44,
  295. 'node_labeled': True,
  296. 'edge_labeled': True,
  297. 'node_attr_dim': 3,
  298. 'geometry': '3D, RI',
  299. 'edge_attr_dim': 0,
  300. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/alchemy_full.zip',
  301. 'domain': 'small molecules',
  302. },
  303. 'aspirin': {
  304. 'database': 'tudataset',
  305. 'reference': '[36]',
  306. 'dataset_size': 111763,
  307. 'class_number': None,
  308. 'task_type': 'regression',
  309. 'ave_node_num': 21.0,
  310. 'ave_edge_num': 151.52,
  311. 'node_labeled': True,
  312. 'edge_labeled': False,
  313. 'node_attr_dim': 6,
  314. 'geometry': '3D, RI',
  315. 'edge_attr_dim': 0,
  316. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/aspirin.zip',
  317. 'domain': 'small molecules',
  318. },
  319. 'benzene': {
  320. 'database': 'tudataset',
  321. 'reference': '[36]',
  322. 'dataset_size': 527984,
  323. 'class_number': None,
  324. 'task_type': 'regression',
  325. 'ave_node_num': 12.0,
  326. 'ave_edge_num': 64.94,
  327. 'node_labeled': True,
  328. 'edge_labeled': False,
  329. 'node_attr_dim': 6,
  330. 'geometry': '3D, RI',
  331. 'edge_attr_dim': 0,
  332. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/benzene.zip',
  333. 'domain': 'small molecules',
  334. },
  335. 'BZR': {
  336. 'database': 'tudataset',
  337. 'reference': '[7]',
  338. 'dataset_size': 405,
  339. 'class_number': 2,
  340. 'task_type': 'classification',
  341. 'ave_node_num': 35.75,
  342. 'ave_edge_num': 38.36,
  343. 'node_labeled': True,
  344. 'edge_labeled': False,
  345. 'node_attr_dim': 3,
  346. 'geometry': '3D, RI',
  347. 'edge_attr_dim': 0,
  348. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR.zip',
  349. 'domain': 'small molecules',
  350. },
  351. 'BZR_MD': {
  352. 'database': 'tudataset',
  353. 'reference': '[7,23]',
  354. 'dataset_size': 306,
  355. 'class_number': 2,
  356. 'task_type': 'classification',
  357. 'ave_node_num': 21.3,
  358. 'ave_edge_num': 225.06,
  359. 'node_labeled': True,
  360. 'edge_labeled': True,
  361. 'node_attr_dim': 0,
  362. 'geometry': None,
  363. 'edge_attr_dim': 1,
  364. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR_MD.zip',
  365. 'domain': 'small molecules',
  366. },
  367. 'COX2': {
  368. 'database': 'tudataset',
  369. 'reference': '[7]',
  370. 'dataset_size': 467,
  371. 'class_number': 2,
  372. 'task_type': 'classification',
  373. 'ave_node_num': 41.22,
  374. 'ave_edge_num': 43.45,
  375. 'node_labeled': True,
  376. 'edge_labeled': False,
  377. 'node_attr_dim': 3,
  378. 'geometry': '3D, RI',
  379. 'edge_attr_dim': 0,
  380. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2.zip',
  381. 'domain': 'small molecules',
  382. },
  383. 'COX2_MD': {
  384. 'database': 'tudataset',
  385. 'reference': '[7,23]',
  386. 'dataset_size': 303,
  387. 'class_number': 2,
  388. 'task_type': 'classification',
  389. 'ave_node_num': 26.28,
  390. 'ave_edge_num': 335.12,
  391. 'node_labeled': True,
  392. 'edge_labeled': True,
  393. 'node_attr_dim': 0,
  394. 'geometry': None,
  395. 'edge_attr_dim': 1,
  396. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2_MD.zip',
  397. 'domain': 'small molecules',
  398. },
  399. 'DHFR': {
  400. 'database': 'tudataset',
  401. 'reference': '[7]',
  402. 'dataset_size': 467,
  403. 'class_number': 2,
  404. 'task_type': 'classification',
  405. 'ave_node_num': 42.43,
  406. 'ave_edge_num': 44.54,
  407. 'node_labeled': True,
  408. 'edge_labeled': False,
  409. 'node_attr_dim': 3,
  410. 'geometry': '3D, RI',
  411. 'edge_attr_dim': 0,
  412. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR.zip',
  413. 'domain': 'small molecules',
  414. },
  415. 'DHFR_MD': {
  416. 'database': 'tudataset',
  417. 'reference': '[7,23]',
  418. 'dataset_size': 393,
  419. 'class_number': 2,
  420. 'task_type': 'classification',
  421. 'ave_node_num': 23.87,
  422. 'ave_edge_num': 283.01,
  423. 'node_labeled': True,
  424. 'edge_labeled': True,
  425. 'node_attr_dim': 0,
  426. 'geometry': None,
  427. 'edge_attr_dim': 1,
  428. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR_MD.zip',
  429. 'domain': 'small molecules',
  430. },
  431. 'ER_MD': {
  432. 'database': 'tudataset',
  433. 'reference': '[7,23]',
  434. 'dataset_size': 446,
  435. 'class_number': 2,
  436. 'task_type': 'classification',
  437. 'ave_node_num': 21.33,
  438. 'ave_edge_num': 234.85,
  439. 'node_labeled': True,
  440. 'edge_labeled': True,
  441. 'node_attr_dim': 0,
  442. 'geometry': None,
  443. 'edge_attr_dim': 1,
  444. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ER_MD.zip',
  445. 'domain': 'small molecules',
  446. },
  447. 'ethanol': {
  448. 'database': 'tudataset',
  449. 'reference': '[36]',
  450. 'dataset_size': 455093,
  451. 'class_number': None,
  452. 'task_type': 'regression',
  453. 'ave_node_num': 9.0,
  454. 'ave_edge_num': 36.0,
  455. 'node_labeled': True,
  456. 'edge_labeled': False,
  457. 'node_attr_dim': 6,
  458. 'geometry': '3D, RI',
  459. 'edge_attr_dim': 0,
  460. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ethanol.zip',
  461. 'domain': 'small molecules',
  462. },
  463. 'FRANKENSTEIN': {
  464. 'database': 'tudataset',
  465. 'reference': '[15]',
  466. 'dataset_size': 4337,
  467. 'class_number': 2,
  468. 'task_type': 'classification',
  469. 'ave_node_num': 16.9,
  470. 'ave_edge_num': 17.88,
  471. 'node_labeled': False,
  472. 'edge_labeled': False,
  473. 'node_attr_dim': 780,
  474. 'geometry': None,
  475. 'edge_attr_dim': 0,
  476. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FRANKENSTEIN.zip',
  477. 'domain': 'small molecules',
  478. },
  479. 'malonaldehyde': {
  480. 'database': 'tudataset',
  481. 'reference': '[36]',
  482. 'dataset_size': 893238,
  483. 'class_number': None,
  484. 'task_type': 'regression',
  485. 'ave_node_num': 9.0,
  486. 'ave_edge_num': 36.0,
  487. 'node_labeled': True,
  488. 'edge_labeled': False,
  489. 'node_attr_dim': 6,
  490. 'geometry': '3D, RI',
  491. 'edge_attr_dim': 0,
  492. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/malonaldehyde.zip',
  493. 'domain': 'small molecules',
  494. },
  495. 'MCF-7': {
  496. 'database': 'tudataset',
  497. 'reference': '[28]',
  498. 'dataset_size': 27770,
  499. 'class_number': 2,
  500. 'task_type': 'classification',
  501. 'ave_node_num': 26.39,
  502. 'ave_edge_num': 28.52,
  503. 'node_labeled': True,
  504. 'edge_labeled': True,
  505. 'node_attr_dim': 0,
  506. 'geometry': None,
  507. 'edge_attr_dim': 0,
  508. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7.zip',
  509. 'domain': 'small molecules',
  510. },
  511. 'MCF-7H': {
  512. 'database': 'tudataset',
  513. 'reference': '[28]',
  514. 'dataset_size': 27770,
  515. 'class_number': 2,
  516. 'task_type': 'classification',
  517. 'ave_node_num': 47.3,
  518. 'ave_edge_num': 49.43,
  519. 'node_labeled': True,
  520. 'edge_labeled': True,
  521. 'node_attr_dim': 0,
  522. 'geometry': None,
  523. 'edge_attr_dim': 0,
  524. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7H.zip',
  525. 'domain': 'small molecules',
  526. },
  527. 'MOLT-4': {
  528. 'database': 'tudataset',
  529. 'reference': '[28]',
  530. 'dataset_size': 39765,
  531. 'class_number': 2,
  532. 'task_type': 'classification',
  533. 'ave_node_num': 26.09,
  534. 'ave_edge_num': 28.13,
  535. 'node_labeled': True,
  536. 'edge_labeled': True,
  537. 'node_attr_dim': 0,
  538. 'geometry': None,
  539. 'edge_attr_dim': 0,
  540. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4.zip',
  541. 'domain': 'small molecules',
  542. },
  543. 'MOLT-4H': {
  544. 'database': 'tudataset',
  545. 'reference': '[28]',
  546. 'dataset_size': 39765,
  547. 'class_number': 2,
  548. 'task_type': 'classification',
  549. 'ave_node_num': 46.7,
  550. 'ave_edge_num': 48.73,
  551. 'node_labeled': True,
  552. 'edge_labeled': True,
  553. 'node_attr_dim': 0,
  554. 'geometry': None,
  555. 'edge_attr_dim': 0,
  556. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4H.zip',
  557. 'domain': 'small molecules',
  558. },
  559. 'Mutagenicity': {
  560. 'database': 'tudataset',
  561. 'reference': '[16,20]',
  562. 'dataset_size': 4337,
  563. 'class_number': 2,
  564. 'task_type': 'classification',
  565. 'ave_node_num': 30.32,
  566. 'ave_edge_num': 30.77,
  567. 'node_labeled': True,
  568. 'edge_labeled': True,
  569. 'node_attr_dim': 0,
  570. 'geometry': None,
  571. 'edge_attr_dim': 0,
  572. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Mutagenicity.zip',
  573. 'domain': 'small molecules',
  574. },
  575. 'MUTAG': {
  576. 'database': 'tudataset',
  577. 'reference': '[1,23]',
  578. 'dataset_size': 188,
  579. 'class_number': 2,
  580. 'task_type': 'classification',
  581. 'ave_node_num': 17.93,
  582. 'ave_edge_num': 19.79,
  583. 'node_labeled': True,
  584. 'edge_labeled': True,
  585. 'node_attr_dim': 0,
  586. 'geometry': None,
  587. 'edge_attr_dim': 0,
  588. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip',
  589. 'domain': 'small molecules',
  590. },
  591. 'naphthalene': {
  592. 'database': 'tudataset',
  593. 'reference': '[36]',
  594. 'dataset_size': 226256,
  595. 'class_number': None,
  596. 'task_type': 'regression',
  597. 'ave_node_num': 18.0,
  598. 'ave_edge_num': 127.37,
  599. 'node_labeled': True,
  600. 'edge_labeled': False,
  601. 'node_attr_dim': 6,
  602. 'geometry': '3D, RI',
  603. 'edge_attr_dim': 0,
  604. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/naphthalene.zip',
  605. 'domain': 'small molecules',
  606. },
  607. 'NCI1': {
  608. 'database': 'tudataset',
  609. 'reference': '[8,9,22]',
  610. 'dataset_size': 4110,
  611. 'class_number': 2,
  612. 'task_type': 'classification',
  613. 'ave_node_num': 29.87,
  614. 'ave_edge_num': 32.3,
  615. 'node_labeled': True,
  616. 'edge_labeled': False,
  617. 'node_attr_dim': 0,
  618. 'geometry': None,
  619. 'edge_attr_dim': 0,
  620. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI1.zip',
  621. 'domain': 'small molecules',
  622. },
  623. 'NCI109': {
  624. 'database': 'tudataset',
  625. 'reference': '[8,9,22]',
  626. 'dataset_size': 4127,
  627. 'class_number': 2,
  628. 'task_type': 'classification',
  629. 'ave_node_num': 29.68,
  630. 'ave_edge_num': 32.13,
  631. 'node_labeled': True,
  632. 'edge_labeled': False,
  633. 'node_attr_dim': 0,
  634. 'geometry': None,
  635. 'edge_attr_dim': 0,
  636. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI109.zip',
  637. 'domain': 'small molecules',
  638. },
  639. 'NCI-H23': {
  640. 'database': 'tudataset',
  641. 'reference': '[28]',
  642. 'dataset_size': 40353,
  643. 'class_number': 2,
  644. 'task_type': 'classification',
  645. 'ave_node_num': 26.07,
  646. 'ave_edge_num': 28.1,
  647. 'node_labeled': True,
  648. 'edge_labeled': True,
  649. 'node_attr_dim': 0,
  650. 'geometry': None,
  651. 'edge_attr_dim': 0,
  652. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23.zip',
  653. 'domain': 'small molecules',
  654. },
  655. 'NCI-H23H': {
  656. 'database': 'tudataset',
  657. 'reference': '[28]',
  658. 'dataset_size': 40353,
  659. 'class_number': 2,
  660. 'task_type': 'classification',
  661. 'ave_node_num': 46.67,
  662. 'ave_edge_num': 48.69,
  663. 'node_labeled': True,
  664. 'edge_labeled': True,
  665. 'node_attr_dim': 0,
  666. 'geometry': None,
  667. 'edge_attr_dim': 0,
  668. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23H.zip',
  669. 'domain': 'small molecules',
  670. },
  671. 'OVCAR-8': {
  672. 'database': 'tudataset',
  673. 'reference': '[28]',
  674. 'dataset_size': 40516,
  675. 'class_number': 2,
  676. 'task_type': 'classification',
  677. 'ave_node_num': 26.07,
  678. 'ave_edge_num': 28.1,
  679. 'node_labeled': True,
  680. 'edge_labeled': True,
  681. 'node_attr_dim': 0,
  682. 'geometry': None,
  683. 'edge_attr_dim': 0,
  684. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8.zip',
  685. 'domain': 'small molecules',
  686. },
  687. 'OVCAR-8H': {
  688. 'database': 'tudataset',
  689. 'reference': '[28]',
  690. 'dataset_size': 40516,
  691. 'class_number': 2,
  692. 'task_type': 'classification',
  693. 'ave_node_num': 46.67,
  694. 'ave_edge_num': 48.7,
  695. 'node_labeled': True,
  696. 'edge_labeled': True,
  697. 'node_attr_dim': 0,
  698. 'geometry': None,
  699. 'edge_attr_dim': 0,
  700. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8H.zip',
  701. 'domain': 'small molecules',
  702. },
  703. 'P388': {
  704. 'database': 'tudataset',
  705. 'reference': '[28]',
  706. 'dataset_size': 41472,
  707. 'class_number': 2,
  708. 'task_type': 'classification',
  709. 'ave_node_num': 22.11,
  710. 'ave_edge_num': 23.55,
  711. 'node_labeled': True,
  712. 'edge_labeled': True,
  713. 'node_attr_dim': 0,
  714. 'geometry': None,
  715. 'edge_attr_dim': 0,
  716. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388.zip',
  717. 'domain': 'small molecules',
  718. },
  719. 'P388H': {
  720. 'database': 'tudataset',
  721. 'reference': '[28]',
  722. 'dataset_size': 41472,
  723. 'class_number': 2,
  724. 'task_type': 'classification',
  725. 'ave_node_num': 40.44,
  726. 'ave_edge_num': 41.88,
  727. 'node_labeled': True,
  728. 'edge_labeled': True,
  729. 'node_attr_dim': 0,
  730. 'geometry': None,
  731. 'edge_attr_dim': 0,
  732. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388H.zip',
  733. 'domain': 'small molecules',
  734. },
  735. 'PC-3': {
  736. 'database': 'tudataset',
  737. 'reference': '[28]',
  738. 'dataset_size': 27509,
  739. 'class_number': 2,
  740. 'task_type': 'classification',
  741. 'ave_node_num': 26.35,
  742. 'ave_edge_num': 28.49,
  743. 'node_labeled': True,
  744. 'edge_labeled': True,
  745. 'node_attr_dim': 0,
  746. 'geometry': None,
  747. 'edge_attr_dim': 0,
  748. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3.zip',
  749. 'domain': 'small molecules',
  750. },
  751. 'PC-3H': {
  752. 'database': 'tudataset',
  753. 'reference': '[28]',
  754. 'dataset_size': 27509,
  755. 'class_number': 2,
  756. 'task_type': 'classification',
  757. 'ave_node_num': 47.19,
  758. 'ave_edge_num': 49.32,
  759. 'node_labeled': True,
  760. 'edge_labeled': True,
  761. 'node_attr_dim': 0,
  762. 'geometry': None,
  763. 'edge_attr_dim': 0,
  764. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3H.zip',
  765. 'domain': 'small molecules',
  766. },
  767. 'PTC_FM': {
  768. 'database': 'tudataset',
  769. 'reference': '[2,23]',
  770. 'dataset_size': 349,
  771. 'class_number': 2,
  772. 'task_type': 'classification',
  773. 'ave_node_num': 14.11,
  774. 'ave_edge_num': 14.48,
  775. 'node_labeled': True,
  776. 'edge_labeled': True,
  777. 'node_attr_dim': 0,
  778. 'geometry': None,
  779. 'edge_attr_dim': 0,
  780. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FM.zip',
  781. 'domain': 'small molecules',
  782. },
  783. 'PTC_FR': {
  784. 'database': 'tudataset',
  785. 'reference': '[2,23]',
  786. 'dataset_size': 351,
  787. 'class_number': 2,
  788. 'task_type': 'classification',
  789. 'ave_node_num': 14.56,
  790. 'ave_edge_num': 15.0,
  791. 'node_labeled': True,
  792. 'edge_labeled': True,
  793. 'node_attr_dim': 0,
  794. 'geometry': None,
  795. 'edge_attr_dim': 0,
  796. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FR.zip',
  797. 'domain': 'small molecules',
  798. },
  799. 'PTC_MM': {
  800. 'database': 'tudataset',
  801. 'reference': '[2,23]',
  802. 'dataset_size': 336,
  803. 'class_number': 2,
  804. 'task_type': 'classification',
  805. 'ave_node_num': 13.97,
  806. 'ave_edge_num': 14.32,
  807. 'node_labeled': True,
  808. 'edge_labeled': True,
  809. 'node_attr_dim': 0,
  810. 'geometry': None,
  811. 'edge_attr_dim': 0,
  812. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MM.zip',
  813. 'domain': 'small molecules',
  814. },
  815. 'PTC_MR': {
  816. 'database': 'tudataset',
  817. 'reference': '[2,23]',
  818. 'dataset_size': 344,
  819. 'class_number': 2,
  820. 'task_type': 'classification',
  821. 'ave_node_num': 14.29,
  822. 'ave_edge_num': 14.69,
  823. 'node_labeled': True,
  824. 'edge_labeled': True,
  825. 'node_attr_dim': 0,
  826. 'geometry': None,
  827. 'edge_attr_dim': 0,
  828. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MR.zip',
  829. 'domain': 'small molecules',
  830. },
  831. 'QM9': {
  832. 'database': 'tudataset',
  833. 'reference': '[33,34,35]',
  834. 'dataset_size': 129433,
  835. 'class_number': None,
  836. 'task_type': 'regression',
  837. 'ave_node_num': 18.03,
  838. 'ave_edge_num': 18.63,
  839. 'node_labeled': False,
  840. 'edge_labeled': False,
  841. 'node_attr_dim': 16,
  842. 'geometry': '3D, RI',
  843. 'edge_attr_dim': 4,
  844. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/QM9.zip',
  845. 'domain': 'small molecules',
  846. },
  847. 'salicylic_acid': {
  848. 'database': 'tudataset',
  849. 'reference': '[36]',
  850. 'dataset_size': 220232,
  851. 'class_number': None,
  852. 'task_type': 'regression',
  853. 'ave_node_num': 16.0,
  854. 'ave_edge_num': 104.13,
  855. 'node_labeled': True,
  856. 'edge_labeled': False,
  857. 'node_attr_dim': 6,
  858. 'geometry': '3D, RI',
  859. 'edge_attr_dim': 0,
  860. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/salicylic_acid.zip',
  861. 'domain': 'small molecules',
  862. },
  863. 'SF-295': {
  864. 'database': 'tudataset',
  865. 'reference': '[28]',
  866. 'dataset_size': 40271,
  867. 'class_number': 2,
  868. 'task_type': 'classification',
  869. 'ave_node_num': 26.06,
  870. 'ave_edge_num': 28.08,
  871. 'node_labeled': True,
  872. 'edge_labeled': True,
  873. 'node_attr_dim': 0,
  874. 'geometry': None,
  875. 'edge_attr_dim': 0,
  876. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295.zip',
  877. 'domain': 'small molecules',
  878. },
  879. 'SF-295H': {
  880. 'database': 'tudataset',
  881. 'reference': '[28]',
  882. 'dataset_size': 40271,
  883. 'class_number': 2,
  884. 'task_type': 'classification',
  885. 'ave_node_num': 46.65,
  886. 'ave_edge_num': 48.68,
  887. 'node_labeled': True,
  888. 'edge_labeled': True,
  889. 'node_attr_dim': 0,
  890. 'geometry': None,
  891. 'edge_attr_dim': 0,
  892. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295H.zip',
  893. 'domain': 'small molecules',
  894. },
  895. 'SN12C': {
  896. 'database': 'tudataset',
  897. 'reference': '[28]',
  898. 'dataset_size': 40004,
  899. 'class_number': 2,
  900. 'task_type': 'classification',
  901. 'ave_node_num': 26.08,
  902. 'ave_edge_num': 28.11,
  903. 'node_labeled': True,
  904. 'edge_labeled': True,
  905. 'node_attr_dim': 0,
  906. 'geometry': None,
  907. 'edge_attr_dim': 0,
  908. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12C.zip',
  909. 'domain': 'small molecules',
  910. },
  911. 'SN12CH': {
  912. 'database': 'tudataset',
  913. 'reference': '[28]',
  914. 'dataset_size': 40004,
  915. 'class_number': 2,
  916. 'task_type': 'classification',
  917. 'ave_node_num': 46.69,
  918. 'ave_edge_num': 48.71,
  919. 'node_labeled': True,
  920. 'edge_labeled': True,
  921. 'node_attr_dim': 0,
  922. 'geometry': None,
  923. 'edge_attr_dim': 0,
  924. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12CH.zip',
  925. 'domain': 'small molecules',
  926. },
  927. 'SW-620': {
  928. 'database': 'tudataset',
  929. 'reference': '[28]',
  930. 'dataset_size': 40532,
  931. 'class_number': 2,
  932. 'task_type': 'classification',
  933. 'ave_node_num': 26.05,
  934. 'ave_edge_num': 28.08,
  935. 'node_labeled': True,
  936. 'edge_labeled': True,
  937. 'node_attr_dim': 0,
  938. 'geometry': None,
  939. 'edge_attr_dim': 0,
  940. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620.zip',
  941. 'domain': 'small molecules',
  942. },
  943. 'SW-620H': {
  944. 'database': 'tudataset',
  945. 'reference': '[28]',
  946. 'dataset_size': 40532,
  947. 'class_number': 2,
  948. 'task_type': 'classification',
  949. 'ave_node_num': 46.62,
  950. 'ave_edge_num': 48.65,
  951. 'node_labeled': True,
  952. 'edge_labeled': True,
  953. 'node_attr_dim': 0,
  954. 'geometry': None,
  955. 'edge_attr_dim': 0,
  956. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620H.zip',
  957. 'domain': 'small molecules',
  958. },
  959. 'toluene': {
  960. 'database': 'tudataset',
  961. 'reference': '[36]',
  962. 'dataset_size': 342791,
  963. 'class_number': None,
  964. 'task_type': 'regression',
  965. 'ave_node_num': 15.0,
  966. 'ave_edge_num': 96.15,
  967. 'node_labeled': True,
  968. 'edge_labeled': False,
  969. 'node_attr_dim': 6,
  970. 'geometry': '3D, RI',
  971. 'edge_attr_dim': 0,
  972. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/toluene.zip',
  973. 'domain': 'small molecules',
  974. },
  975. 'Tox21_AhR_training': {
  976. 'database': 'tudataset',
  977. 'reference': '[24]',
  978. 'dataset_size': 8169,
  979. 'class_number': 2,
  980. 'task_type': 'classification',
  981. 'ave_node_num': 18.09,
  982. 'ave_edge_num': 18.5,
  983. 'node_labeled': True,
  984. 'edge_labeled': True,
  985. 'node_attr_dim': 0,
  986. 'geometry': None,
  987. 'edge_attr_dim': 0,
  988. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_training.zip',
  989. 'domain': 'small molecules',
  990. },
  991. 'Tox21_AhR_testing': {
  992. 'database': 'tudataset',
  993. 'reference': '[24]',
  994. 'dataset_size': 272,
  995. 'class_number': 2,
  996. 'task_type': 'classification',
  997. 'ave_node_num': 22.13,
  998. 'ave_edge_num': 23.05,
  999. 'node_labeled': True,
  1000. 'edge_labeled': True,
  1001. 'node_attr_dim': 0,
  1002. 'geometry': None,
  1003. 'edge_attr_dim': 0,
  1004. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_testing.zip',
  1005. 'domain': 'small molecules',
  1006. },
  1007. 'Tox21_AhR_evaluation': {
  1008. 'database': 'tudataset',
  1009. 'reference': '[24]',
  1010. 'dataset_size': 607,
  1011. 'class_number': 2,
  1012. 'task_type': 'classification',
  1013. 'ave_node_num': 17.64,
  1014. 'ave_edge_num': 18.06,
  1015. 'node_labeled': True,
  1016. 'edge_labeled': True,
  1017. 'node_attr_dim': 0,
  1018. 'geometry': None,
  1019. 'edge_attr_dim': 0,
  1020. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_evaluation.zip',
  1021. 'domain': 'small molecules',
  1022. },
  1023. 'Tox21_AR_training': {
  1024. 'database': 'tudataset',
  1025. 'reference': '[24]',
  1026. 'dataset_size': 9362,
  1027. 'class_number': 2,
  1028. 'task_type': 'classification',
  1029. 'ave_node_num': 18.39,
  1030. 'ave_edge_num': 18.84,
  1031. 'node_labeled': True,
  1032. 'edge_labeled': True,
  1033. 'node_attr_dim': 0,
  1034. 'geometry': None,
  1035. 'edge_attr_dim': 0,
  1036. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_training.zip',
  1037. 'domain': 'small molecules',
  1038. },
  1039. 'Tox21_AR_testing': {
  1040. 'database': 'tudataset',
  1041. 'reference': '[24]',
  1042. 'dataset_size': 292,
  1043. 'class_number': 2,
  1044. 'task_type': 'classification',
  1045. 'ave_node_num': 22.35,
  1046. 'ave_edge_num': 23.32,
  1047. 'node_labeled': True,
  1048. 'edge_labeled': True,
  1049. 'node_attr_dim': 0,
  1050. 'geometry': None,
  1051. 'edge_attr_dim': 0,
  1052. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_testing.zip',
  1053. 'domain': 'small molecules',
  1054. },
  1055. 'Tox21_AR_evaluation': {
  1056. 'database': 'tudataset',
  1057. 'reference': '[24]',
  1058. 'dataset_size': 585,
  1059. 'class_number': 2,
  1060. 'task_type': 'classification',
  1061. 'ave_node_num': 17.99,
  1062. 'ave_edge_num': 18.45,
  1063. 'node_labeled': True,
  1064. 'edge_labeled': True,
  1065. 'node_attr_dim': 0,
  1066. 'geometry': None,
  1067. 'edge_attr_dim': 0,
  1068. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_evaluation.zip',
  1069. 'domain': 'small molecules',
  1070. },
  1071. 'Tox21_AR-LBD_training': {
  1072. 'database': 'tudataset',
  1073. 'reference': '[24]',
  1074. 'dataset_size': 8599,
  1075. 'class_number': 2,
  1076. 'task_type': 'classification',
  1077. 'ave_node_num': 17.77,
  1078. 'ave_edge_num': 18.16,
  1079. 'node_labeled': True,
  1080. 'edge_labeled': True,
  1081. 'node_attr_dim': 0,
  1082. 'geometry': None,
  1083. 'edge_attr_dim': 0,
  1084. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_training.zip',
  1085. 'domain': 'small molecules',
  1086. },
  1087. 'Tox21_AR-LBD_testing': {
  1088. 'database': 'tudataset',
  1089. 'reference': '[24]',
  1090. 'dataset_size': 253,
  1091. 'class_number': 2,
  1092. 'task_type': 'classification',
  1093. 'ave_node_num': 21.85,
  1094. 'ave_edge_num': 22.73,
  1095. 'node_labeled': True,
  1096. 'edge_labeled': True,
  1097. 'node_attr_dim': 0,
  1098. 'geometry': None,
  1099. 'edge_attr_dim': 0,
  1100. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_testing.zip',
  1101. 'domain': 'small molecules',
  1102. },
  1103. 'Tox21_AR-LBD_evaluation': {
  1104. 'database': 'tudataset',
  1105. 'reference': '[24]',
  1106. 'dataset_size': 580,
  1107. 'class_number': 2,
  1108. 'task_type': 'classification',
  1109. 'ave_node_num': 17.09,
  1110. 'ave_edge_num': 17.42,
  1111. 'node_labeled': True,
  1112. 'edge_labeled': True,
  1113. 'node_attr_dim': 0,
  1114. 'geometry': None,
  1115. 'edge_attr_dim': 0,
  1116. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_evaluation.zip',
  1117. 'domain': 'small molecules',
  1118. },
  1119. 'Tox21_ARE_training': {
  1120. 'database': 'tudataset',
  1121. 'reference': '[24]',
  1122. 'dataset_size': 7167,
  1123. 'class_number': 2,
  1124. 'task_type': 'classification',
  1125. 'ave_node_num': 16.28,
  1126. 'ave_edge_num': 16.52,
  1127. 'node_labeled': True,
  1128. 'edge_labeled': True,
  1129. 'node_attr_dim': 0,
  1130. 'geometry': None,
  1131. 'edge_attr_dim': 0,
  1132. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_training.zip',
  1133. 'domain': 'small molecules',
  1134. },
  1135. 'Tox21_ARE_testing': {
  1136. 'database': 'tudataset',
  1137. 'reference': '[24]',
  1138. 'dataset_size': 234,
  1139. 'class_number': 2,
  1140. 'task_type': 'classification',
  1141. 'ave_node_num': 21.99,
  1142. 'ave_edge_num': 22.91,
  1143. 'node_labeled': True,
  1144. 'edge_labeled': True,
  1145. 'node_attr_dim': 0,
  1146. 'geometry': None,
  1147. 'edge_attr_dim': 0,
  1148. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_testing.zip',
  1149. 'domain': 'small molecules',
  1150. },
  1151. 'Tox21_ARE_evaluation': {
  1152. 'database': 'tudataset',
  1153. 'reference': '[24]',
  1154. 'dataset_size': 552,
  1155. 'class_number': 2,
  1156. 'task_type': 'classification',
  1157. 'ave_node_num': 17.01,
  1158. 'ave_edge_num': 17.33,
  1159. 'node_labeled': True,
  1160. 'edge_labeled': True,
  1161. 'node_attr_dim': 0,
  1162. 'geometry': None,
  1163. 'edge_attr_dim': 0,
  1164. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_evaluation.zip',
  1165. 'domain': 'small molecules',
  1166. },
  1167. 'Tox21_aromatase_training': {
  1168. 'database': 'tudataset',
  1169. 'reference': '[24]',
  1170. 'dataset_size': 7226,
  1171. 'class_number': 2,
  1172. 'task_type': 'classification',
  1173. 'ave_node_num': 17.5,
  1174. 'ave_edge_num': 17.79,
  1175. 'node_labeled': True,
  1176. 'edge_labeled': True,
  1177. 'node_attr_dim': 0,
  1178. 'geometry': None,
  1179. 'edge_attr_dim': 0,
  1180. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_training.zip',
  1181. 'domain': 'small molecules',
  1182. },
  1183. 'Tox21_aromatase_testing': {
  1184. 'database': 'tudataset',
  1185. 'reference': '[24]',
  1186. 'dataset_size': 214,
  1187. 'class_number': 2,
  1188. 'task_type': 'classification',
  1189. 'ave_node_num': 21.65,
  1190. 'ave_edge_num': 22.36,
  1191. 'node_labeled': True,
  1192. 'edge_labeled': True,
  1193. 'node_attr_dim': 0,
  1194. 'geometry': None,
  1195. 'edge_attr_dim': 0,
  1196. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_testing.zip',
  1197. 'domain': 'small molecules',
  1198. },
  1199. 'Tox21_aromatase_evaluation': {
  1200. 'database': 'tudataset',
  1201. 'reference': '[24]',
  1202. 'dataset_size': 528,
  1203. 'class_number': 2,
  1204. 'task_type': 'classification',
  1205. 'ave_node_num': 16.74,
  1206. 'ave_edge_num': 16.99,
  1207. 'node_labeled': True,
  1208. 'edge_labeled': True,
  1209. 'node_attr_dim': 0,
  1210. 'geometry': None,
  1211. 'edge_attr_dim': 0,
  1212. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_evaluation.zip',
  1213. 'domain': 'small molecules',
  1214. },
  1215. 'Tox21_ATAD5_training': {
  1216. 'database': 'tudataset',
  1217. 'reference': '[24]',
  1218. 'dataset_size': 9091,
  1219. 'class_number': 2,
  1220. 'task_type': 'classification',
  1221. 'ave_node_num': 17.89,
  1222. 'ave_edge_num': 18.3,
  1223. 'node_labeled': True,
  1224. 'edge_labeled': True,
  1225. 'node_attr_dim': 0,
  1226. 'geometry': None,
  1227. 'edge_attr_dim': 0,
  1228. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_training.zip',
  1229. 'domain': 'small molecules',
  1230. },
  1231. 'Tox21_ATAD5_testing': {
  1232. 'database': 'tudataset',
  1233. 'reference': '[24]',
  1234. 'dataset_size': 272,
  1235. 'class_number': 2,
  1236. 'task_type': 'classification',
  1237. 'ave_node_num': 21.99,
  1238. 'ave_edge_num': 22.89,
  1239. 'node_labeled': True,
  1240. 'edge_labeled': True,
  1241. 'node_attr_dim': 0,
  1242. 'geometry': None,
  1243. 'edge_attr_dim': 0,
  1244. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_testing.zip',
  1245. 'domain': 'small molecules',
  1246. },
  1247. 'Tox21_ATAD5_evaluation': {
  1248. 'database': 'tudataset',
  1249. 'reference': '[24]',
  1250. 'dataset_size': 619,
  1251. 'class_number': 2,
  1252. 'task_type': 'classification',
  1253. 'ave_node_num': 17.68,
  1254. 'ave_edge_num': 18.11,
  1255. 'node_labeled': True,
  1256. 'edge_labeled': True,
  1257. 'node_attr_dim': 0,
  1258. 'geometry': None,
  1259. 'edge_attr_dim': 0,
  1260. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_evaluation.zip',
  1261. 'domain': 'small molecules',
  1262. },
  1263. 'Tox21_ER_training': {
  1264. 'database': 'tudataset',
  1265. 'reference': '[24]',
  1266. 'dataset_size': 7697,
  1267. 'class_number': 2,
  1268. 'task_type': 'classification',
  1269. 'ave_node_num': 17.58,
  1270. 'ave_edge_num': 17.94,
  1271. 'node_labeled': True,
  1272. 'edge_labeled': True,
  1273. 'node_attr_dim': 0,
  1274. 'geometry': None,
  1275. 'edge_attr_dim': 0,
  1276. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_training.zip',
  1277. 'domain': 'small molecules',
  1278. },
  1279. 'Tox21_ER_testing': {
  1280. 'database': 'tudataset',
  1281. 'reference': '[24]',
  1282. 'dataset_size': 265,
  1283. 'class_number': 2,
  1284. 'task_type': 'classification',
  1285. 'ave_node_num': 22.16,
  1286. 'ave_edge_num': 23.13,
  1287. 'node_labeled': True,
  1288. 'edge_labeled': True,
  1289. 'node_attr_dim': 0,
  1290. 'geometry': None,
  1291. 'edge_attr_dim': 0,
  1292. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_testing.zip',
  1293. 'domain': 'small molecules',
  1294. },
  1295. 'Tox21_ER_evaluation': {
  1296. 'database': 'tudataset',
  1297. 'reference': '[24]',
  1298. 'dataset_size': 515,
  1299. 'class_number': 2,
  1300. 'task_type': 'classification',
  1301. 'ave_node_num': 17.66,
  1302. 'ave_edge_num': 18.1,
  1303. 'node_labeled': True,
  1304. 'edge_labeled': True,
  1305. 'node_attr_dim': 0,
  1306. 'geometry': None,
  1307. 'edge_attr_dim': 0,
  1308. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_evaluation.zip',
  1309. 'domain': 'small molecules',
  1310. },
  1311. 'Tox21_ER-LBD_training': {
  1312. 'database': 'tudataset',
  1313. 'reference': '[24]',
  1314. 'dataset_size': 8753,
  1315. 'class_number': 2,
  1316. 'task_type': 'classification',
  1317. 'ave_node_num': 18.06,
  1318. 'ave_edge_num': 18.47,
  1319. 'node_labeled': True,
  1320. 'edge_labeled': True,
  1321. 'node_attr_dim': 0,
  1322. 'geometry': None,
  1323. 'edge_attr_dim': 0,
  1324. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_training.zip',
  1325. 'domain': 'small molecules',
  1326. },
  1327. 'Tox21_ER-LBD_testing': {
  1328. 'database': 'tudataset',
  1329. 'reference': '[24]',
  1330. 'dataset_size': 287,
  1331. 'class_number': 2,
  1332. 'task_type': 'classification',
  1333. 'ave_node_num': 22.28,
  1334. 'ave_edge_num': 23.23,
  1335. 'node_labeled': True,
  1336. 'edge_labeled': True,
  1337. 'node_attr_dim': 0,
  1338. 'geometry': None,
  1339. 'edge_attr_dim': 0,
  1340. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_testing.zip',
  1341. 'domain': 'small molecules',
  1342. },
  1343. 'Tox21_ER-LBD_evaluation': {
  1344. 'database': 'tudataset',
  1345. 'reference': '[24]',
  1346. 'dataset_size': 599,
  1347. 'class_number': 2,
  1348. 'task_type': 'classification',
  1349. 'ave_node_num': 17.75,
  1350. 'ave_edge_num': 18.17,
  1351. 'node_labeled': True,
  1352. 'edge_labeled': True,
  1353. 'node_attr_dim': 0,
  1354. 'geometry': None,
  1355. 'edge_attr_dim': 0,
  1356. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_evaluation.zip',
  1357. 'domain': 'small molecules',
  1358. },
  1359. 'Tox21_HSE_training': {
  1360. 'database': 'tudataset',
  1361. 'reference': '[24]',
  1362. 'dataset_size': 8150,
  1363. 'class_number': 2,
  1364. 'task_type': 'classification',
  1365. 'ave_node_num': 16.72,
  1366. 'ave_edge_num': 17.04,
  1367. 'node_labeled': True,
  1368. 'edge_labeled': True,
  1369. 'node_attr_dim': 0,
  1370. 'geometry': None,
  1371. 'edge_attr_dim': 0,
  1372. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_training.zip',
  1373. 'domain': 'small molecules',
  1374. },
  1375. 'Tox21_HSE_testing': {
  1376. 'database': 'tudataset',
  1377. 'reference': '[24]',
  1378. 'dataset_size': 267,
  1379. 'class_number': 2,
  1380. 'task_type': 'classification',
  1381. 'ave_node_num': 22.07,
  1382. 'ave_edge_num': 23.0,
  1383. 'node_labeled': True,
  1384. 'edge_labeled': True,
  1385. 'node_attr_dim': 0,
  1386. 'geometry': None,
  1387. 'edge_attr_dim': 0,
  1388. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_testing.zip',
  1389. 'domain': 'small molecules',
  1390. },
  1391. 'Tox21_HSE_evaluation': {
  1392. 'database': 'tudataset',
  1393. 'reference': '[24]',
  1394. 'dataset_size': 607,
  1395. 'class_number': 2,
  1396. 'task_type': 'classification',
  1397. 'ave_node_num': 17.61,
  1398. 'ave_edge_num': 18.01,
  1399. 'node_labeled': True,
  1400. 'edge_labeled': True,
  1401. 'node_attr_dim': 0,
  1402. 'geometry': None,
  1403. 'edge_attr_dim': 0,
  1404. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_evaluation.zip',
  1405. 'domain': 'small molecules',
  1406. },
  1407. 'Tox21_MMP_training': {
  1408. 'database': 'tudataset',
  1409. 'reference': '[24]',
  1410. 'dataset_size': 7320,
  1411. 'class_number': 2,
  1412. 'task_type': 'classification',
  1413. 'ave_node_num': 17.49,
  1414. 'ave_edge_num': 17.83,
  1415. 'node_labeled': True,
  1416. 'edge_labeled': True,
  1417. 'node_attr_dim': 0,
  1418. 'geometry': None,
  1419. 'edge_attr_dim': 0,
  1420. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_training.zip',
  1421. 'domain': 'small molecules',
  1422. },
  1423. 'Tox21_MMP_testing': {
  1424. 'database': 'tudataset',
  1425. 'reference': '[24]',
  1426. 'dataset_size': 238,
  1427. 'class_number': 2,
  1428. 'task_type': 'classification',
  1429. 'ave_node_num': 21.68,
  1430. 'ave_edge_num': 22.55,
  1431. 'node_labeled': True,
  1432. 'edge_labeled': True,
  1433. 'node_attr_dim': 0,
  1434. 'geometry': None,
  1435. 'edge_attr_dim': 0,
  1436. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_testing.zip',
  1437. 'domain': 'small molecules',
  1438. },
  1439. 'Tox21_MMP_evaluation': {
  1440. 'database': 'tudataset',
  1441. 'reference': '[24]',
  1442. 'dataset_size': 541,
  1443. 'class_number': 2,
  1444. 'task_type': 'classification',
  1445. 'ave_node_num': 16.67,
  1446. 'ave_edge_num': 16.88,
  1447. 'node_labeled': True,
  1448. 'edge_labeled': True,
  1449. 'node_attr_dim': 0,
  1450. 'geometry': None,
  1451. 'edge_attr_dim': 0,
  1452. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_evaluation.zip',
  1453. 'domain': 'small molecules',
  1454. },
  1455. 'Tox21_p53_training': {
  1456. 'database': 'tudataset',
  1457. 'reference': '[24]',
  1458. 'dataset_size': 8634,
  1459. 'class_number': 2,
  1460. 'task_type': 'classification',
  1461. 'ave_node_num': 17.79,
  1462. 'ave_edge_num': 18.19,
  1463. 'node_labeled': True,
  1464. 'edge_labeled': True,
  1465. 'node_attr_dim': 0,
  1466. 'geometry': None,
  1467. 'edge_attr_dim': 0,
  1468. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_training.zip',
  1469. 'domain': 'small molecules',
  1470. },
  1471. 'Tox21_p53_testing': {
  1472. 'database': 'tudataset',
  1473. 'reference': '[24]',
  1474. 'dataset_size': 269,
  1475. 'class_number': 2,
  1476. 'task_type': 'classification',
  1477. 'ave_node_num': 22.14,
  1478. 'ave_edge_num': 23.04,
  1479. 'node_labeled': True,
  1480. 'edge_labeled': True,
  1481. 'node_attr_dim': 0,
  1482. 'geometry': None,
  1483. 'edge_attr_dim': 0,
  1484. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_testing.zip',
  1485. 'domain': 'small molecules',
  1486. },
  1487. 'Tox21_p53_evaluation': {
  1488. 'database': 'tudataset',
  1489. 'reference': '[24]',
  1490. 'dataset_size': 613,
  1491. 'class_number': 2,
  1492. 'task_type': 'classification',
  1493. 'ave_node_num': 17.34,
  1494. 'ave_edge_num': 17.72,
  1495. 'node_labeled': True,
  1496. 'edge_labeled': True,
  1497. 'node_attr_dim': 0,
  1498. 'geometry': None,
  1499. 'edge_attr_dim': 0,
  1500. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_evaluation.zip',
  1501. 'domain': 'small molecules',
  1502. },
  1503. 'Tox21_PPAR-gamma_training': {
  1504. 'database': 'tudataset',
  1505. 'reference': '[24]',
  1506. 'dataset_size': 8184,
  1507. 'class_number': 2,
  1508. 'task_type': 'classification',
  1509. 'ave_node_num': 17.23,
  1510. 'ave_edge_num': 17.55,
  1511. 'node_labeled': True,
  1512. 'edge_labeled': True,
  1513. 'node_attr_dim': 0,
  1514. 'geometry': None,
  1515. 'edge_attr_dim': 0,
  1516. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_training.zip',
  1517. 'domain': 'small molecules',
  1518. },
  1519. 'Tox21_PPAR-gamma_testing': {
  1520. 'database': 'tudataset',
  1521. 'reference': '[24]',
  1522. 'dataset_size': 267,
  1523. 'class_number': 2,
  1524. 'task_type': 'classification',
  1525. 'ave_node_num': 22.04,
  1526. 'ave_edge_num': 22.93,
  1527. 'node_labeled': True,
  1528. 'edge_labeled': True,
  1529. 'node_attr_dim': 0,
  1530. 'geometry': None,
  1531. 'edge_attr_dim': 0,
  1532. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_testing.zip',
  1533. 'domain': 'small molecules',
  1534. },
  1535. 'Tox21_PPAR-gamma_evaluation': {
  1536. 'database': 'tudataset',
  1537. 'reference': '[24]',
  1538. 'dataset_size': 602,
  1539. 'class_number': 2,
  1540. 'task_type': 'classification',
  1541. 'ave_node_num': 17.38,
  1542. 'ave_edge_num': 17.77,
  1543. 'node_labeled': True,
  1544. 'edge_labeled': True,
  1545. 'node_attr_dim': 0,
  1546. 'geometry': None,
  1547. 'edge_attr_dim': 0,
  1548. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_evaluation.zip',
  1549. 'domain': 'small molecules',
  1550. },
  1551. 'UACC257': {
  1552. 'database': 'tudataset',
  1553. 'reference': '[28]',
  1554. 'dataset_size': 39988,
  1555. 'class_number': 2,
  1556. 'task_type': 'classification',
  1557. 'ave_node_num': 26.09,
  1558. 'ave_edge_num': 28.12,
  1559. 'node_labeled': True,
  1560. 'edge_labeled': True,
  1561. 'node_attr_dim': 0,
  1562. 'geometry': None,
  1563. 'edge_attr_dim': 0,
  1564. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257.zip',
  1565. 'domain': 'small molecules',
  1566. },
  1567. 'UACC257H': {
  1568. 'database': 'tudataset',
  1569. 'reference': '[28]',
  1570. 'dataset_size': 39988,
  1571. 'class_number': 2,
  1572. 'task_type': 'classification',
  1573. 'ave_node_num': 46.68,
  1574. 'ave_edge_num': 48.71,
  1575. 'node_labeled': True,
  1576. 'edge_labeled': True,
  1577. 'node_attr_dim': 0,
  1578. 'geometry': None,
  1579. 'edge_attr_dim': 0,
  1580. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257H.zip',
  1581. 'domain': 'small molecules',
  1582. },
  1583. 'uracil': {
  1584. 'database': 'tudataset',
  1585. 'reference': '[36]',
  1586. 'dataset_size': 133770,
  1587. 'class_number': None,
  1588. 'task_type': 'regression',
  1589. 'ave_node_num': 12.0,
  1590. 'ave_edge_num': 64.44,
  1591. 'node_labeled': True,
  1592. 'edge_labeled': False,
  1593. 'node_attr_dim': 6,
  1594. 'geometry': '3D, RI',
  1595. 'edge_attr_dim': 0,
  1596. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/uracil.zip',
  1597. 'domain': 'small molecules',
  1598. },
  1599. 'Yeast': {
  1600. 'database': 'tudataset',
  1601. 'reference': '[28]',
  1602. 'dataset_size': 79601,
  1603. 'class_number': 2,
  1604. 'task_type': 'classification',
  1605. 'ave_node_num': 21.54,
  1606. 'ave_edge_num': 22.84,
  1607. 'node_labeled': True,
  1608. 'edge_labeled': True,
  1609. 'node_attr_dim': 0,
  1610. 'geometry': None,
  1611. 'edge_attr_dim': 0,
  1612. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Yeast.zip',
  1613. 'domain': 'small molecules',
  1614. },
  1615. 'YeastH': {
  1616. 'database': 'tudataset',
  1617. 'reference': '[28]',
  1618. 'dataset_size': 79601,
  1619. 'class_number': 2,
  1620. 'task_type': 'classification',
  1621. 'ave_node_num': 39.44,
  1622. 'ave_edge_num': 40.74,
  1623. 'node_labeled': True,
  1624. 'edge_labeled': True,
  1625. 'node_attr_dim': 0,
  1626. 'geometry': None,
  1627. 'edge_attr_dim': 0,
  1628. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/YeastH.zip',
  1629. 'domain': 'small molecules',
  1630. },
  1631. 'ZINC_full': {
  1632. 'database': 'tudataset',
  1633. 'reference': '[31]',
  1634. 'dataset_size': 249456,
  1635. 'class_number': None,
  1636. 'task_type': 'regression',
  1637. 'ave_node_num': 23.14,
  1638. 'ave_edge_num': 24.91,
  1639. 'node_labeled': True,
  1640. 'edge_labeled': True,
  1641. 'node_attr_dim': 0,
  1642. 'geometry': None,
  1643. 'edge_attr_dim': 0,
  1644. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_full.zip',
  1645. 'domain': 'small molecules',
  1646. },
  1647. 'ZINC_test': {
  1648. 'database': 'tudataset',
  1649. 'reference': '[31]',
  1650. 'dataset_size': 5000,
  1651. 'class_number': None,
  1652. 'task_type': 'regression',
  1653. 'ave_node_num': 23.1,
  1654. 'ave_edge_num': 24.83,
  1655. 'node_labeled': True,
  1656. 'edge_labeled': True,
  1657. 'node_attr_dim': 0,
  1658. 'geometry': None,
  1659. 'edge_attr_dim': 0,
  1660. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_test.zip',
  1661. 'domain': 'small molecules',
  1662. },
  1663. 'ZINC_train': {
  1664. 'database': 'tudataset',
  1665. 'reference': '[31]',
  1666. 'dataset_size': 220011,
  1667. 'class_number': None,
  1668. 'task_type': 'regression',
  1669. 'ave_node_num': 23.15,
  1670. 'ave_edge_num': 24.91,
  1671. 'node_labeled': True,
  1672. 'edge_labeled': True,
  1673. 'node_attr_dim': 0,
  1674. 'geometry': None,
  1675. 'edge_attr_dim': 0,
  1676. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_train.zip',
  1677. 'domain': 'small molecules',
  1678. },
  1679. 'ZINC_val': {
  1680. 'database': 'tudataset',
  1681. 'reference': '[31]',
  1682. 'dataset_size': 24445,
  1683. 'class_number': None,
  1684. 'task_type': 'regression',
  1685. 'ave_node_num': 23.13,
  1686. 'ave_edge_num': 24.88,
  1687. 'node_labeled': True,
  1688. 'edge_labeled': True,
  1689. 'node_attr_dim': 0,
  1690. 'geometry': None,
  1691. 'edge_attr_dim': 0,
  1692. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_val.zip',
  1693. 'domain': 'small molecules',
  1694. },
  1695. ### bioinformatics
  1696. 'DD': {
  1697. 'database': 'tudataset',
  1698. 'reference': '[6,22]',
  1699. 'dataset_size': 1178,
  1700. 'class_number': 2,
  1701. 'task_type': 'classification',
  1702. 'ave_node_num': 284.32,
  1703. 'ave_edge_num': 715.66,
  1704. 'node_labeled': True,
  1705. 'edge_labeled': False,
  1706. 'node_attr_dim': 0,
  1707. 'geometry': None,
  1708. 'edge_attr_dim': 0,
  1709. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DD.zip',
  1710. 'domain': 'bioinformatics',
  1711. },
  1712. 'ENZYMES': {
  1713. 'database': 'tudataset',
  1714. 'reference': '[4,5]',
  1715. 'dataset_size': 600,
  1716. 'class_number': 6,
  1717. 'task_type': 'classification',
  1718. 'ave_node_num': 32.63,
  1719. 'ave_edge_num': 62.14,
  1720. 'node_labeled': True,
  1721. 'edge_labeled': False,
  1722. 'node_attr_dim': 18,
  1723. 'geometry': None,
  1724. 'edge_attr_dim': 0,
  1725. 'url': 'http://www.chrsmrrs.com/graphkerneldatasets/ENZYMES.zip',
  1726. 'domain': 'bioinformatics',
  1727. },
  1728. 'KKI': {
  1729. 'database': 'tudataset',
  1730. 'reference': '[26]',
  1731. 'dataset_size': 83,
  1732. 'class_number': 2,
  1733. 'task_type': 'classification',
  1734. 'ave_node_num': 26.96,
  1735. 'ave_edge_num': 48.42,
  1736. 'node_labeled': True,
  1737. 'edge_labeled': False,
  1738. 'node_attr_dim': 0,
  1739. 'geometry': None,
  1740. 'edge_attr_dim': 0,
  1741. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/KKI.zip',
  1742. 'domain': 'bioinformatics',
  1743. },
  1744. 'OHSU': {
  1745. 'database': 'tudataset',
  1746. 'reference': '[26]',
  1747. 'dataset_size': 79,
  1748. 'class_number': 2,
  1749. 'task_type': 'classification',
  1750. 'ave_node_num': 82.01,
  1751. 'ave_edge_num': 199.66,
  1752. 'node_labeled': True,
  1753. 'edge_labeled': False,
  1754. 'node_attr_dim': 0,
  1755. 'geometry': None,
  1756. 'edge_attr_dim': 0,
  1757. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OHSU.zip',
  1758. 'domain': 'bioinformatics',
  1759. },
  1760. 'Peking_1': {
  1761. 'database': 'tudataset',
  1762. 'reference': '[26]',
  1763. 'dataset_size': 85,
  1764. 'class_number': 2,
  1765. 'task_type': 'classification',
  1766. 'ave_node_num': 39.31,
  1767. 'ave_edge_num': 77.35,
  1768. 'node_labeled': True,
  1769. 'edge_labeled': False,
  1770. 'node_attr_dim': 0,
  1771. 'geometry': None,
  1772. 'edge_attr_dim': 0,
  1773. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Peking_1.zip',
  1774. 'domain': 'bioinformatics',
  1775. },
  1776. 'PROTEINS': {
  1777. 'database': 'tudataset',
  1778. 'reference': '[4,6]',
  1779. 'dataset_size': 1113,
  1780. 'class_number': 2,
  1781. 'task_type': 'classification',
  1782. 'ave_node_num': 39.06,
  1783. 'ave_edge_num': 72.82,
  1784. 'node_labeled': True,
  1785. 'edge_labeled': False,
  1786. 'node_attr_dim': 1,
  1787. 'geometry': None,
  1788. 'edge_attr_dim': 0,
  1789. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS.zip',
  1790. 'domain': 'bioinformatics',
  1791. },
  1792. 'PROTEINS_full': {
  1793. 'database': 'tudataset',
  1794. 'reference': '[4,6]',
  1795. 'dataset_size': 1113,
  1796. 'class_number': 2,
  1797. 'task_type': 'classification',
  1798. 'ave_node_num': 39.06,
  1799. 'ave_edge_num': 72.82,
  1800. 'node_labeled': True,
  1801. 'edge_labeled': False,
  1802. 'node_attr_dim': 29,
  1803. 'geometry': None,
  1804. 'edge_attr_dim': 0,
  1805. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS_full.zip',
  1806. 'domain': 'bioinformatics',
  1807. },
  1808. ### computer vision
  1809. 'COIL-DEL': {
  1810. 'database': 'tudataset',
  1811. 'reference': '[16,18]',
  1812. 'dataset_size': 3900,
  1813. 'class_number': 100,
  1814. 'task_type': 'classification',
  1815. 'ave_node_num': 21.54,
  1816. 'ave_edge_num': 54.24,
  1817. 'node_labeled': False,
  1818. 'edge_labeled': True,
  1819. 'node_attr_dim': 2,
  1820. 'geometry': None,
  1821. 'edge_attr_dim': 0,
  1822. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-DEL.zip',
  1823. 'domain': 'computer vision',
  1824. },
  1825. 'COIL-RAG': {
  1826. 'database': 'tudataset',
  1827. 'reference': '[16,18]',
  1828. 'dataset_size': 3900,
  1829. 'class_number': 100,
  1830. 'task_type': 'classification',
  1831. 'ave_node_num': 3.01,
  1832. 'ave_edge_num': 3.02,
  1833. 'node_labeled': False,
  1834. 'edge_labeled': False,
  1835. 'node_attr_dim': 64,
  1836. 'geometry': None,
  1837. 'edge_attr_dim': 1,
  1838. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-RAG.zip',
  1839. 'domain': 'computer vision',
  1840. },
  1841. 'Cuneiform': {
  1842. 'database': 'tudataset',
  1843. 'reference': '[25]',
  1844. 'dataset_size': 267,
  1845. 'class_number': 30,
  1846. 'task_type': 'classification',
  1847. 'ave_node_num': 21.27,
  1848. 'ave_edge_num': 44.8,
  1849. 'node_labeled': True,
  1850. 'edge_labeled': True,
  1851. 'node_attr_dim': 3,
  1852. 'geometry': '3D',
  1853. 'edge_attr_dim': 2,
  1854. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Cuneiform.zip',
  1855. 'domain': 'computer vision',
  1856. },
  1857. 'Fingerprint': {
  1858. 'database': 'tudataset',
  1859. 'reference': '[16,19]',
  1860. 'dataset_size': 2800,
  1861. 'class_number': 4,
  1862. 'task_type': 'classification',
  1863. 'ave_node_num': 5.42,
  1864. 'ave_edge_num': 4.42,
  1865. 'node_labeled': False,
  1866. 'edge_labeled': False,
  1867. 'node_attr_dim': 2,
  1868. 'geometry': '2D',
  1869. 'edge_attr_dim': 2,
  1870. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Fingerprint.zip',
  1871. 'domain': 'computer vision',
  1872. },
  1873. 'FIRSTMM_DB': {
  1874. 'database': 'tudataset',
  1875. 'reference': '[11,12,13]',
  1876. 'dataset_size': 41,
  1877. 'class_number': 11,
  1878. 'task_type': 'classification',
  1879. 'ave_node_num': 1377.27,
  1880. 'ave_edge_num': 3074.1,
  1881. 'node_labeled': True,
  1882. 'edge_labeled': False,
  1883. 'node_attr_dim': 1,
  1884. 'geometry': None,
  1885. 'edge_attr_dim': 2,
  1886. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FIRSTMM_DB.zip',
  1887. 'domain': 'computer vision',
  1888. },
  1889. 'Letter-high': {
  1890. 'database': 'tudataset',
  1891. 'reference': '[16]',
  1892. 'dataset_size': 2250,
  1893. 'class_number': 15,
  1894. 'task_type': 'classification',
  1895. 'ave_node_num': 4.67,
  1896. 'ave_edge_num': 4.5,
  1897. 'node_labeled': False,
  1898. 'edge_labeled': False,
  1899. 'node_attr_dim': 2,
  1900. 'geometry': '2D',
  1901. 'edge_attr_dim': 0,
  1902. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-high.zip',
  1903. 'domain': 'computer vision',
  1904. },
  1905. 'Letter-low': {
  1906. 'database': 'tudataset',
  1907. 'reference': '[16]',
  1908. 'dataset_size': 2250,
  1909. 'class_number': 15,
  1910. 'task_type': 'classification',
  1911. 'ave_node_num': 4.68,
  1912. 'ave_edge_num': 3.13,
  1913. 'node_labeled': False,
  1914. 'edge_labeled': False,
  1915. 'node_attr_dim': 2,
  1916. 'geometry': '2D',
  1917. 'edge_attr_dim': 0,
  1918. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-low.zip',
  1919. 'domain': 'computer vision',
  1920. },
  1921. 'Letter-med': {
  1922. 'database': 'tudataset',
  1923. 'reference': '[16]',
  1924. 'dataset_size': 2250,
  1925. 'class_number': 15,
  1926. 'task_type': 'classification',
  1927. 'ave_node_num': 4.67,
  1928. 'ave_edge_num': 4.5,
  1929. 'node_labeled': False,
  1930. 'edge_labeled': False,
  1931. 'node_attr_dim': 2,
  1932. 'geometry': '2D',
  1933. 'edge_attr_dim': 0,
  1934. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-med.zip',
  1935. 'domain': 'computer vision',
  1936. },
  1937. 'MSRC_9': {
  1938. 'database': 'tudataset',
  1939. 'reference': '[13]',
  1940. 'dataset_size': 221,
  1941. 'class_number': 8,
  1942. 'task_type': 'classification',
  1943. 'ave_node_num': 40.58,
  1944. 'ave_edge_num': 97.94,
  1945. 'node_labeled': True,
  1946. 'edge_labeled': False,
  1947. 'node_attr_dim': 0,
  1948. 'geometry': None,
  1949. 'edge_attr_dim': 0,
  1950. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_9.zip',
  1951. 'domain': 'computer vision',
  1952. },
  1953. 'MSRC_21': {
  1954. 'database': 'tudataset',
  1955. 'reference': '[13]',
  1956. 'dataset_size': 563,
  1957. 'class_number': 20,
  1958. 'task_type': 'classification',
  1959. 'ave_node_num': 77.52,
  1960. 'ave_edge_num': 198.32,
  1961. 'node_labeled': True,
  1962. 'edge_labeled': False,
  1963. 'node_attr_dim': 0,
  1964. 'geometry': None,
  1965. 'edge_attr_dim': 0,
  1966. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21.zip',
  1967. 'domain': 'computer vision',
  1968. },
  1969. 'MSRC_21C': {
  1970. 'database': 'tudataset',
  1971. 'reference': '[13]',
  1972. 'dataset_size': 209,
  1973. 'class_number': 20,
  1974. 'task_type': 'classification',
  1975. 'ave_node_num': 40.28,
  1976. 'ave_edge_num': 96.6,
  1977. 'node_labeled': True,
  1978. 'edge_labeled': False,
  1979. 'node_attr_dim': 0,
  1980. 'geometry': None,
  1981. 'edge_attr_dim': 0,
  1982. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21C.zip',
  1983. 'domain': 'computer vision',
  1984. },
  1985. ### social networks
  1986. 'COLLAB': {
  1987. 'database': 'tudataset',
  1988. 'reference': '[14]',
  1989. 'dataset_size': 5000,
  1990. 'class_number': 3,
  1991. 'task_type': 'classification',
  1992. 'ave_node_num': 74.49,
  1993. 'ave_edge_num': 2457.78,
  1994. 'node_labeled': False,
  1995. 'edge_labeled': False,
  1996. 'node_attr_dim': 0,
  1997. 'geometry': None,
  1998. 'edge_attr_dim': 0,
  1999. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLLAB.zip',
  2000. 'domain': 'social networks',
  2001. },
  2002. 'dblp_ct1': {
  2003. 'database': 'tudataset',
  2004. 'reference': '[32]',
  2005. 'dataset_size': 755,
  2006. 'class_number': 2,
  2007. 'task_type': 'classification',
  2008. 'ave_node_num': 52.87,
  2009. 'ave_edge_num': 320.09,
  2010. 'node_labeled': False,
  2011. 'edge_labeled': False,
  2012. 'node_attr_dim': 0,
  2013. 'geometry': None,
  2014. 'edge_attr_dim': 'temporal',
  2015. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct1.zip',
  2016. 'domain': 'social networks',
  2017. },
  2018. 'dblp_ct2': {
  2019. 'database': 'tudataset',
  2020. 'reference': '[32]',
  2021. 'dataset_size': 755,
  2022. 'class_number': 2,
  2023. 'task_type': 'classification',
  2024. 'ave_node_num': 52.87,
  2025. 'ave_edge_num': 320.09,
  2026. 'node_labeled': False,
  2027. 'edge_labeled': False,
  2028. 'node_attr_dim': 0,
  2029. 'geometry': None,
  2030. 'edge_attr_dim': 'temporal',
  2031. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct2.zip',
  2032. 'domain': 'social networks',
  2033. },
  2034. 'DBLP_v1': {
  2035. 'database': 'tudataset',
  2036. 'reference': '[26]',
  2037. 'dataset_size': 19456,
  2038. 'class_number': 2,
  2039. 'task_type': 'classification',
  2040. 'ave_node_num': 10.48,
  2041. 'ave_edge_num': 19.65,
  2042. 'node_labeled': True,
  2043. 'edge_labeled': True,
  2044. 'node_attr_dim': 0,
  2045. 'geometry': None,
  2046. 'edge_attr_dim': 0,
  2047. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DBLP_v1.zip',
  2048. 'domain': 'social networks',
  2049. },
  2050. 'deezer_ego_nets': {
  2051. 'database': 'tudataset',
  2052. 'reference': '[30]',
  2053. 'dataset_size': 9629,
  2054. 'class_number': 2,
  2055. 'task_type': 'classification',
  2056. 'ave_node_num': 23.49,
  2057. 'ave_edge_num': 65.25,
  2058. 'node_labeled': False,
  2059. 'edge_labeled': False,
  2060. 'node_attr_dim': 0,
  2061. 'geometry': None,
  2062. 'edge_attr_dim': 0,
  2063. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/deezer_ego_nets.zip',
  2064. 'domain': 'social networks',
  2065. },
  2066. 'facebook_ct1': {
  2067. 'database': 'tudataset',
  2068. 'reference': '[32]',
  2069. 'dataset_size': 995,
  2070. 'class_number': 2,
  2071. 'task_type': 'classification',
  2072. 'ave_node_num': 95.72,
  2073. 'ave_edge_num': 269.01,
  2074. 'node_labeled': False,
  2075. 'edge_labeled': False,
  2076. 'node_attr_dim': 0,
  2077. 'geometry': None,
  2078. 'edge_attr_dim': 'temporal',
  2079. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct1.zip',
  2080. 'domain': 'social networks',
  2081. },
  2082. 'facebook_ct2': {
  2083. 'database': 'tudataset',
  2084. 'reference': '[32]',
  2085. 'dataset_size': 995,
  2086. 'class_number': 2,
  2087. 'task_type': 'classification',
  2088. 'ave_node_num': 95.72,
  2089. 'ave_edge_num': 269.01,
  2090. 'node_labeled': False,
  2091. 'edge_labeled': False,
  2092. 'node_attr_dim': 0,
  2093. 'geometry': None,
  2094. 'edge_attr_dim': 'temporal',
  2095. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct2.zip',
  2096. 'domain': 'social networks',
  2097. },
  2098. 'github_stargazers': {
  2099. 'database': 'tudataset',
  2100. 'reference': '[30]',
  2101. 'dataset_size': 12725,
  2102. 'class_number': 2,
  2103. 'task_type': 'classification',
  2104. 'ave_node_num': 113.79,
  2105. 'ave_edge_num': 234.64,
  2106. 'node_labeled': False,
  2107. 'edge_labeled': False,
  2108. 'node_attr_dim': 0,
  2109. 'geometry': None,
  2110. 'edge_attr_dim': 0,
  2111. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/github_stargazers.zip',
  2112. 'domain': 'social networks',
  2113. },
  2114. 'highschool_ct1': {
  2115. 'database': 'tudataset',
  2116. 'reference': '[32]',
  2117. 'dataset_size': 180,
  2118. 'class_number': 2,
  2119. 'task_type': 'classification',
  2120. 'ave_node_num': 52.32,
  2121. 'ave_edge_num': 544.81,
  2122. 'node_labeled': False,
  2123. 'edge_labeled': False,
  2124. 'node_attr_dim': 0,
  2125. 'geometry': None,
  2126. 'edge_attr_dim': 'temporal',
  2127. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct1.zip',
  2128. 'domain': 'social networks',
  2129. },
  2130. 'highschool_ct2': {
  2131. 'database': 'tudataset',
  2132. 'reference': '[32]',
  2133. 'dataset_size': 180,
  2134. 'class_number': 2,
  2135. 'task_type': 'classification',
  2136. 'ave_node_num': 52.32,
  2137. 'ave_edge_num': 544.81,
  2138. 'node_labeled': False,
  2139. 'edge_labeled': False,
  2140. 'node_attr_dim': 0,
  2141. 'geometry': None,
  2142. 'edge_attr_dim': 'temporal',
  2143. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct2.zip',
  2144. 'domain': 'social networks',
  2145. },
  2146. 'IMDB-BINARY': {
  2147. 'database': 'tudataset',
  2148. 'reference': '[14]',
  2149. 'dataset_size': 1000,
  2150. 'class_number': 2,
  2151. 'task_type': 'classification',
  2152. 'ave_node_num': 19.77,
  2153. 'ave_edge_num': 96.53,
  2154. 'node_labeled': False,
  2155. 'edge_labeled': False,
  2156. 'node_attr_dim': 0,
  2157. 'geometry': '',
  2158. 'edge_attr_dim': 0,
  2159. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-BINARY.zip',
  2160. 'domain': 'social networks',
  2161. },
  2162. 'IMDB-MULTI': {
  2163. 'database': 'tudataset',
  2164. 'reference': '[14]',
  2165. 'dataset_size': 1500,
  2166. 'class_number': 3,
  2167. 'task_type': 'classification',
  2168. 'ave_node_num': 13.0,
  2169. 'ave_edge_num': 65.94,
  2170. 'node_labeled': False,
  2171. 'edge_labeled': False,
  2172. 'node_attr_dim': 0,
  2173. 'geometry': '',
  2174. 'edge_attr_dim': 0,
  2175. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-MULTI.zip',
  2176. 'domain': 'social networks',
  2177. },
  2178. 'infectious_ct1': {
  2179. 'database': 'tudataset',
  2180. 'reference': '[32]',
  2181. 'dataset_size': 200,
  2182. 'class_number': 2,
  2183. 'task_type': 'classification',
  2184. 'ave_node_num': 50.0,
  2185. 'ave_edge_num': 459.72,
  2186. 'node_labeled': False,
  2187. 'edge_labeled': False,
  2188. 'node_attr_dim': 0,
  2189. 'geometry': None,
  2190. 'edge_attr_dim': 'temporal',
  2191. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct1.zip',
  2192. 'domain': 'social networks',
  2193. },
  2194. 'infectious_ct2': {
  2195. 'database': 'tudataset',
  2196. 'reference': '[32]',
  2197. 'dataset_size': 200,
  2198. 'class_number': 2,
  2199. 'task_type': 'classification',
  2200. 'ave_node_num': 50.0,
  2201. 'ave_edge_num': 459.72,
  2202. 'node_labeled': False,
  2203. 'edge_labeled': False,
  2204. 'node_attr_dim': 0,
  2205. 'geometry': None,
  2206. 'edge_attr_dim': 'temporal',
  2207. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct2.zip',
  2208. 'domain': 'social networks',
  2209. },
  2210. 'mit_ct1': {
  2211. 'database': 'tudataset',
  2212. 'reference': '[32]',
  2213. 'dataset_size': 97,
  2214. 'class_number': 2,
  2215. 'task_type': 'classification',
  2216. 'ave_node_num': 20.0,
  2217. 'ave_edge_num': 1469.15,
  2218. 'node_labeled': False,
  2219. 'edge_labeled': False,
  2220. 'node_attr_dim': 0,
  2221. 'geometry': None,
  2222. 'edge_attr_dim': 'temporal',
  2223. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct1.zip',
  2224. 'domain': 'social networks',
  2225. },
  2226. 'mit_ct2': {
  2227. 'database': 'tudataset',
  2228. 'reference': '[32]',
  2229. 'dataset_size': 97,
  2230. 'class_number': 2,
  2231. 'task_type': 'classification',
  2232. 'ave_node_num': 20.0,
  2233. 'ave_edge_num': 1469.15,
  2234. 'node_labeled': False,
  2235. 'edge_labeled': False,
  2236. 'node_attr_dim': 0,
  2237. 'geometry': None,
  2238. 'edge_attr_dim': 'temporal',
  2239. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct2.zip',
  2240. 'domain': 'social networks',
  2241. },
  2242. 'REDDIT-BINARY': {
  2243. 'database': 'tudataset',
  2244. 'reference': '[14]',
  2245. 'dataset_size': 2000,
  2246. 'class_number': 2,
  2247. 'task_type': 'classification',
  2248. 'ave_node_num': 429.63,
  2249. 'ave_edge_num': 497.75,
  2250. 'node_labeled': False,
  2251. 'edge_labeled': False,
  2252. 'node_attr_dim': 0,
  2253. 'geometry': None,
  2254. 'edge_attr_dim': 0,
  2255. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-BINARY.zip',
  2256. 'domain': 'social networks',
  2257. },
  2258. 'REDDIT-MULTI-5K': {
  2259. 'database': 'tudataset',
  2260. 'reference': '[14]',
  2261. 'dataset_size': 4999,
  2262. 'class_number': 5,
  2263. 'task_type': 'classification',
  2264. 'ave_node_num': 508.52,
  2265. 'ave_edge_num': 594.87,
  2266. 'node_labeled': False,
  2267. 'edge_labeled': False,
  2268. 'node_attr_dim': 0,
  2269. 'geometry': None,
  2270. 'edge_attr_dim': 0,
  2271. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-5K.zip',
  2272. 'domain': 'social networks',
  2273. },
  2274. 'REDDIT-MULTI-12K': {
  2275. 'database': 'tudataset',
  2276. 'reference': '[14]',
  2277. 'dataset_size': 11929,
  2278. 'class_number': 11,
  2279. 'task_type': 'classification',
  2280. 'ave_node_num': 391.41,
  2281. 'ave_edge_num': 456.89,
  2282. 'node_labeled': False,
  2283. 'edge_labeled': False,
  2284. 'node_attr_dim': 0,
  2285. 'geometry': None,
  2286. 'edge_attr_dim': 0,
  2287. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-12K.zip',
  2288. 'domain': 'social networks',
  2289. },
  2290. 'reddit_threads': {
  2291. 'database': 'tudataset',
  2292. 'reference': '[30]',
  2293. 'dataset_size': 203088,
  2294. 'class_number': 2,
  2295. 'task_type': 'classification',
  2296. 'ave_node_num': 23.93,
  2297. 'ave_edge_num': 24.99,
  2298. 'node_labeled': False,
  2299. 'edge_labeled': False,
  2300. 'node_attr_dim': 0,
  2301. 'geometry': None,
  2302. 'edge_attr_dim': 0,
  2303. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/reddit_threads.zip',
  2304. 'domain': 'social networks',
  2305. },
  2306. 'tumblr_ct1': {
  2307. 'database': 'tudataset',
  2308. 'reference': '[32]',
  2309. 'dataset_size': 373,
  2310. 'class_number': 2,
  2311. 'task_type': 'classification',
  2312. 'ave_node_num': 53.11,
  2313. 'ave_edge_num': 199.78,
  2314. 'node_labeled': False,
  2315. 'edge_labeled': False,
  2316. 'node_attr_dim': 0,
  2317. 'geometry': None,
  2318. 'edge_attr_dim': 'temporal',
  2319. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct1.zip',
  2320. 'domain': 'social networks',
  2321. },
  2322. 'tumblr_ct2': {
  2323. 'database': 'tudataset',
  2324. 'reference': '[32]',
  2325. 'dataset_size': 373,
  2326. 'class_number': 2,
  2327. 'task_type': 'classification',
  2328. 'ave_node_num': 53.11,
  2329. 'ave_edge_num': 199.78,
  2330. 'node_labeled': False,
  2331. 'edge_labeled': False,
  2332. 'node_attr_dim': 0,
  2333. 'geometry': None,
  2334. 'edge_attr_dim': 'temporal',
  2335. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct2.zip',
  2336. 'domain': 'social networks',
  2337. },
  2338. 'twitch_egos': {
  2339. 'database': 'tudataset',
  2340. 'reference': '[30]',
  2341. 'dataset_size': 127094,
  2342. 'class_number': 2,
  2343. 'task_type': 'classification',
  2344. 'ave_node_num': 29.67,
  2345. 'ave_edge_num': 86.59,
  2346. 'node_labeled': False,
  2347. 'edge_labeled': False,
  2348. 'node_attr_dim': 0,
  2349. 'geometry': None,
  2350. 'edge_attr_dim': 0,
  2351. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/twitch_egos.zip',
  2352. 'domain': 'social networks',
  2353. },
  2354. 'TWITTER-Real-Graph-Partial': {
  2355. 'database': 'tudataset',
  2356. 'reference': '[26]',
  2357. 'dataset_size': 144033,
  2358. 'class_number': 2,
  2359. 'task_type': 'classification',
  2360. 'ave_node_num': 4.03,
  2361. 'ave_edge_num': 4.98,
  2362. 'node_labeled': True,
  2363. 'edge_labeled': False,
  2364. 'node_attr_dim': 0,
  2365. 'geometry': None,
  2366. 'edge_attr_dim': 1,
  2367. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TWITTER-Real-Graph-Partial.zip',
  2368. 'domain': 'social networks',
  2369. },
  2370. ### synthetic
  2371. 'COLORS-3': {
  2372. 'database': 'tudataset',
  2373. 'reference': '[27]',
  2374. 'dataset_size': 10500,
  2375. 'class_number': 11,
  2376. 'task_type': 'classification',
  2377. 'ave_node_num': 61.31,
  2378. 'ave_edge_num': 91.03,
  2379. 'node_labeled': False,
  2380. 'edge_labeled': False,
  2381. 'node_attr_dim': 4,
  2382. 'geometry': None,
  2383. 'edge_attr_dim': 0,
  2384. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLORS-3.zip',
  2385. 'domain': 'synthetic',
  2386. },
  2387. 'SYNTHETIC': {
  2388. 'database': 'tudataset',
  2389. 'reference': '[3]',
  2390. 'dataset_size': 300,
  2391. 'class_number': 2,
  2392. 'task_type': 'classification',
  2393. 'ave_node_num': 100.0,
  2394. 'ave_edge_num': 196.0,
  2395. 'node_labeled': False,
  2396. 'edge_labeled': False,
  2397. 'node_attr_dim': 1,
  2398. 'geometry': None,
  2399. 'edge_attr_dim': 0,
  2400. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETIC.zip',
  2401. 'domain': 'synthetic',
  2402. },
  2403. 'SYNTHETICnew': {
  2404. 'database': 'tudataset',
  2405. 'reference': '[3,10]',
  2406. 'dataset_size': 300,
  2407. 'class_number': 2,
  2408. 'task_type': 'classification',
  2409. 'ave_node_num': 100.0,
  2410. 'ave_edge_num': 196.25,
  2411. 'node_labeled': False,
  2412. 'edge_labeled': False,
  2413. 'node_attr_dim': 1,
  2414. 'geometry': None,
  2415. 'edge_attr_dim': 0,
  2416. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETICnew.zip',
  2417. 'domain': 'synthetic',
  2418. },
  2419. 'Synthie': {
  2420. 'database': 'tudataset',
  2421. 'reference': '[21]',
  2422. 'dataset_size': 400,
  2423. 'class_number': 4,
  2424. 'task_type': 'classification',
  2425. 'ave_node_num': 95.0,
  2426. 'ave_edge_num': 172.93,
  2427. 'node_labeled': False,
  2428. 'edge_labeled': False,
  2429. 'node_attr_dim': 15,
  2430. 'geometry': None,
  2431. 'edge_attr_dim': 0,
  2432. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Synthie.zip',
  2433. 'domain': 'synthetic',
  2434. },
  2435. 'TRIANGLES': {
  2436. 'database': 'tudataset',
  2437. 'reference': '[27]',
  2438. 'dataset_size': 45000,
  2439. 'class_number': 10,
  2440. 'task_type': 'classification',
  2441. 'ave_node_num': 20.85,
  2442. 'ave_edge_num': 32.74,
  2443. 'node_labeled': False,
  2444. 'edge_labeled': False,
  2445. 'node_attr_dim': 0,
  2446. 'geometry': None,
  2447. 'edge_attr_dim': 0,
  2448. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TRIANGLES.zip',
  2449. 'domain': 'synthetic',
  2450. },
  2451. }
  2452. DATASET_META = {**GREYC_META, **IAM_META, **TUDataset_META}
  2453. def list_of_databases():
  2454. """List names of all databases.
  2455. Returns
  2456. -------
  2457. list
  2458. The list of all databases.
  2459. """
  2460. return [i for i in DATABASES]
  2461. def list_of_datasets():
  2462. """List names of all datasets.
  2463. Returns
  2464. -------
  2465. list
  2466. The list of all datasets.
  2467. """
  2468. return [i for i in DATASET_META]

A Python package for graph kernels, graph edit distances, and the graph pre-image problem.