You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

metadata.py 65 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. Created on Tue Oct 20 14:25:49 2020
  5. @author: ljia
  6. """
  7. DATABASES = {
  8. 'greyc': 'https://brunl01.users.greyc.fr/CHEMISTRY/',
  9. 'iam': 'https://iapr-tc15.greyc.fr/IAM/',
  10. 'tudataset': 'http://graphlearning.io/docs/datasets/',
  11. }
  12. ### -------- database greyc -------- ###
  13. GREYC_META = {
  14. 'ACE': {
  15. 'database': 'greyc',
  16. 'reference': None,
  17. 'dataset_size': 32,
  18. 'class_number': 2,
  19. 'task_type': 'classification',
  20. 'ave_node_num': 52,
  21. 'ave_edge_num': None,
  22. 'node_labeled': None,
  23. 'edge_labeled': None,
  24. 'node_attr_dim': None,
  25. 'geometry': None,
  26. 'edge_attr_dim': None,
  27. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ACEDataset.tar',
  28. 'domain': 'small molecules',
  29. 'train_valid_test': [],
  30. 'stereoisomerism': True,
  31. 'load_files': [],
  32. },
  33. 'Acyclic': {
  34. 'database': 'greyc',
  35. 'reference': None,
  36. 'dataset_size': 183,
  37. 'class_number': None,
  38. 'task_type': 'regression',
  39. 'ave_node_num': 8.15,
  40. 'ave_edge_num': 7.15,
  41. 'node_labeled': True,
  42. 'edge_labeled': False,
  43. 'node_attr_dim': 0,
  44. 'geometry': None,
  45. 'edge_attr_dim': 0,
  46. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/Acyclic.tar.gz',
  47. 'domain': 'small molecules',
  48. 'train_valid_test': None,
  49. 'stereoisomerism': False,
  50. 'load_files': ['dataset_bps.ds'],
  51. },
  52. 'AIDS_greyc': {
  53. 'database': 'greyc',
  54. 'reference': None,
  55. 'dataset_size': 2000,
  56. 'class_number': 2,
  57. 'task_type': 'classification',
  58. 'ave_node_num': 15.69,
  59. 'ave_edge_num': 16.20,
  60. 'node_labeled': True,
  61. 'edge_labeled': True,
  62. 'node_attr_dim': None,
  63. 'geometry': None,
  64. 'edge_attr_dim': None,
  65. 'url': 'https://iapr-tc15.greyc.fr/IAM/AIDS.zip',
  66. 'domain': 'small molecules',
  67. 'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl',],
  68. 'stereoisomerism': False,
  69. 'load_files': ['data/'],
  70. },
  71. 'Alkane': {
  72. 'database': 'greyc',
  73. 'reference': None,
  74. 'dataset_size': 150,
  75. 'class_number': None,
  76. 'task_type': 'regression',
  77. 'ave_node_num': 8.87,
  78. 'ave_edge_num': 7.87,
  79. 'node_labeled': False,
  80. 'edge_labeled': False,
  81. 'node_attr_dim': 0,
  82. 'geometry': None,
  83. 'edge_attr_dim': 0,
  84. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/alkane_dataset.tar.gz',
  85. 'domain': 'small molecules',
  86. 'train_valid_test': None,
  87. 'stereoisomerism': False,
  88. 'load_files': ['dataset.ds', 'dataset_boiling_point_names.txt'],
  89. },
  90. 'Chiral': {
  91. 'database': 'greyc',
  92. 'reference': None,
  93. 'dataset_size': 35,
  94. 'class_number': None,
  95. 'task_type': 'regression',
  96. 'ave_node_num': 21.29,
  97. 'ave_edge_num': None,
  98. 'node_labeled': None,
  99. 'edge_labeled': None,
  100. 'node_attr_dim': None,
  101. 'geometry': None,
  102. 'edge_attr_dim': None,
  103. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetAcyclicChiral.tar',
  104. 'domain': 'small molecules',
  105. 'train_valid_test': [],
  106. 'stereoisomerism': True,
  107. 'load_files': [],
  108. },
  109. 'MAO': {
  110. 'database': 'greyc',
  111. 'reference': None,
  112. 'dataset_size': 68,
  113. 'class_number': 2,
  114. 'task_type': 'classification',
  115. 'ave_node_num': 18.38,
  116. 'ave_edge_num': 19.63,
  117. 'node_labeled': True,
  118. 'edge_labeled': True,
  119. 'node_attr_dim': 0,
  120. 'geometry': None,
  121. 'edge_attr_dim': 0,
  122. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/mao.tgz',
  123. 'domain': 'small molecules',
  124. 'train_valid_test': None,
  125. 'stereoisomerism': False,
  126. 'load_files': ['dataset.ds'],
  127. },
  128. 'Monoterpenoides': {
  129. 'database': 'greyc',
  130. 'reference': None,
  131. 'dataset_size': 382,
  132. 'class_number': 10,
  133. 'task_type': 'classification',
  134. 'ave_node_num': 10,
  135. 'ave_edge_num': None,
  136. 'node_labeled': None,
  137. 'edge_labeled': None,
  138. 'node_attr_dim': None,
  139. 'geometry': None,
  140. 'edge_attr_dim': None,
  141. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/monoterpenoides.tar.gz',
  142. 'domain': 'small molecules',
  143. 'train_valid_test': None,
  144. 'stereoisomerism': False,
  145. 'load_files': ['dataset_10+.ds'],
  146. },
  147. 'PAH': {
  148. 'database': 'greyc',
  149. 'reference': None,
  150. 'dataset_size': 94,
  151. 'class_number': 2,
  152. 'task_type': 'classification',
  153. 'ave_node_num': 20.7,
  154. 'ave_edge_num': 24.43,
  155. 'node_labeled': False,
  156. 'edge_labeled': False,
  157. 'node_attr_dim': 0,
  158. 'geometry': None,
  159. 'edge_attr_dim': 0,
  160. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/PAH.tar.gz',
  161. 'domain': 'small molecules',
  162. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  163. 'stereoisomerism': False,
  164. 'load_files': [],
  165. },
  166. 'PTC': {
  167. 'database': 'greyc',
  168. 'reference': None,
  169. 'dataset_size': 416,
  170. 'class_number': None,
  171. 'task_type': 'classification',
  172. 'ave_node_num': 14.4,
  173. 'ave_edge_num': None,
  174. 'node_labeled': None,
  175. 'edge_labeled': None,
  176. 'node_attr_dim': None,
  177. 'geometry': None,
  178. 'edge_attr_dim': None,
  179. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ptc.tgz',
  180. 'domain': 'small molecules',
  181. 'train_valid_test': None,
  182. 'stereoisomerism': False,
  183. 'load_files': [],
  184. 'extra_info': 'This dataset has test and train datasets. Select gender between mm, fm, mr, fr. \ndataloader = DataLoader(\'Ptc\',root = ..., option = \'mm\') \ntest,train = dataloader.dataset \nGs_test, y_test = test \nGs_train_, y_train = train',
  185. },
  186. 'Steroid': {
  187. 'database': 'greyc',
  188. 'reference': None,
  189. 'dataset_size': 64,
  190. 'class_number': None,
  191. 'task_type': 'regression',
  192. 'ave_node_num': 75.11,
  193. 'ave_edge_num': None,
  194. 'node_labeled': None,
  195. 'edge_labeled': None,
  196. 'node_attr_dim': None,
  197. 'geometry': None,
  198. 'edge_attr_dim': None,
  199. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/SteroidDataset.tar',
  200. 'domain': 'small molecules',
  201. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  202. 'stereoisomerism': False,
  203. 'load_files': [],
  204. },
  205. 'Vitamin_D': {
  206. 'database': 'greyc',
  207. 'reference': None,
  208. 'dataset_size': 69,
  209. 'class_number': None,
  210. 'task_type': 'regression',
  211. 'ave_node_num': 76.91,
  212. 'ave_edge_num': None,
  213. 'node_labeled': None,
  214. 'edge_labeled': None,
  215. 'node_attr_dim': None,
  216. 'geometry': None,
  217. 'edge_attr_dim': None,
  218. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetVitamin.tar',
  219. 'domain': 'small molecules',
  220. 'train_valid_test': [],
  221. 'stereoisomerism': True,
  222. 'load_files': [],
  223. },
  224. }
  225. ### -------- database iam -------- ###
  226. # @todo: several datasets in this database are included in TUDataset. However they do not include train/valid/test sets.
  227. IAM_META = {
  228. 'GREC': {
  229. 'database': 'iam',
  230. 'reference': None,
  231. 'dataset_size': None,
  232. 'class_number': None,
  233. 'task_type': None,
  234. 'ave_node_num': None,
  235. 'ave_edge_num': None,
  236. 'node_labeled': None,
  237. 'edge_labeled': None,
  238. 'node_attr_dim': None,
  239. 'geometry': None,
  240. 'edge_attr_dim': None,
  241. 'url': 'https://iapr-tc15.greyc.fr/IAM/GREC.zip',
  242. 'domain': None,
  243. 'train_valid_test': ['data/test.cxl','data/train.cxl', 'data/valid.cxl'],
  244. 'load_files': [],
  245. },
  246. 'Web': {
  247. 'database': 'iam',
  248. 'reference': None,
  249. 'dataset_size': None,
  250. 'class_number': None,
  251. 'task_type': None,
  252. 'ave_node_num': None,
  253. 'ave_edge_num': None,
  254. 'node_labeled': None,
  255. 'edge_labeled': None,
  256. 'node_attr_dim': None,
  257. 'geometry': None,
  258. 'edge_attr_dim': None,
  259. 'url': 'https://iapr-tc15.greyc.fr/IAM/Web.zip',
  260. 'domain': None,
  261. 'train_valid_test': ['data/test.cxl', 'data/train.cxl', 'data/valid.cxl'],
  262. 'load_files': [],
  263. },
  264. }
  265. ### -------- database tudataset -------- ###
  266. TUDataset_META = {
  267. ### small molecules
  268. 'AIDS': {
  269. 'database': 'tudataset',
  270. 'reference': '[16,17]',
  271. 'dataset_size': 2000,
  272. 'class_number': 2,
  273. 'task_type': 'classification',
  274. 'ave_node_num': 15.69,
  275. 'ave_edge_num': 16.2,
  276. 'node_labeled': True,
  277. 'edge_labeled': True,
  278. 'node_attr_dim': 4,
  279. 'geometry': None,
  280. 'edge_attr_dim': 0,
  281. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/AIDS.zip',
  282. 'domain': 'small molecules',
  283. },
  284. 'alchemy_full': {
  285. 'database': 'tudataset',
  286. 'reference': '[29]',
  287. 'dataset_size': 202579,
  288. 'class_number': None,
  289. 'task_type': 'regression',
  290. 'ave_node_num': 10.1,
  291. 'ave_edge_num': 10.44,
  292. 'node_labeled': True,
  293. 'edge_labeled': True,
  294. 'node_attr_dim': 3,
  295. 'geometry': '3D, RI',
  296. 'edge_attr_dim': 0,
  297. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/alchemy_full.zip',
  298. 'domain': 'small molecules',
  299. },
  300. 'aspirin': {
  301. 'database': 'tudataset',
  302. 'reference': '[36]',
  303. 'dataset_size': 111763,
  304. 'class_number': None,
  305. 'task_type': 'regression',
  306. 'ave_node_num': 21.0,
  307. 'ave_edge_num': 151.52,
  308. 'node_labeled': True,
  309. 'edge_labeled': False,
  310. 'node_attr_dim': 6,
  311. 'geometry': '3D, RI',
  312. 'edge_attr_dim': 0,
  313. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/aspirin.zip',
  314. 'domain': 'small molecules',
  315. },
  316. 'benzene': {
  317. 'database': 'tudataset',
  318. 'reference': '[36]',
  319. 'dataset_size': 527984,
  320. 'class_number': None,
  321. 'task_type': 'regression',
  322. 'ave_node_num': 12.0,
  323. 'ave_edge_num': 64.94,
  324. 'node_labeled': True,
  325. 'edge_labeled': False,
  326. 'node_attr_dim': 6,
  327. 'geometry': '3D, RI',
  328. 'edge_attr_dim': 0,
  329. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/benzene.zip',
  330. 'domain': 'small molecules',
  331. },
  332. 'BZR': {
  333. 'database': 'tudataset',
  334. 'reference': '[7]',
  335. 'dataset_size': 405,
  336. 'class_number': 2,
  337. 'task_type': 'classification',
  338. 'ave_node_num': 35.75,
  339. 'ave_edge_num': 38.36,
  340. 'node_labeled': True,
  341. 'edge_labeled': False,
  342. 'node_attr_dim': 3,
  343. 'geometry': '3D, RI',
  344. 'edge_attr_dim': 0,
  345. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR.zip',
  346. 'domain': 'small molecules',
  347. },
  348. 'BZR_MD': {
  349. 'database': 'tudataset',
  350. 'reference': '[7,23]',
  351. 'dataset_size': 306,
  352. 'class_number': 2,
  353. 'task_type': 'classification',
  354. 'ave_node_num': 21.3,
  355. 'ave_edge_num': 225.06,
  356. 'node_labeled': True,
  357. 'edge_labeled': True,
  358. 'node_attr_dim': 0,
  359. 'geometry': None,
  360. 'edge_attr_dim': 1,
  361. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR_MD.zip',
  362. 'domain': 'small molecules',
  363. },
  364. 'COX2': {
  365. 'database': 'tudataset',
  366. 'reference': '[7]',
  367. 'dataset_size': 467,
  368. 'class_number': 2,
  369. 'task_type': 'classification',
  370. 'ave_node_num': 41.22,
  371. 'ave_edge_num': 43.45,
  372. 'node_labeled': True,
  373. 'edge_labeled': False,
  374. 'node_attr_dim': 3,
  375. 'geometry': '3D, RI',
  376. 'edge_attr_dim': 0,
  377. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2.zip',
  378. 'domain': 'small molecules',
  379. },
  380. 'COX2_MD': {
  381. 'database': 'tudataset',
  382. 'reference': '[7,23]',
  383. 'dataset_size': 303,
  384. 'class_number': 2,
  385. 'task_type': 'classification',
  386. 'ave_node_num': 26.28,
  387. 'ave_edge_num': 335.12,
  388. 'node_labeled': True,
  389. 'edge_labeled': True,
  390. 'node_attr_dim': 0,
  391. 'geometry': None,
  392. 'edge_attr_dim': 1,
  393. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2_MD.zip',
  394. 'domain': 'small molecules',
  395. },
  396. 'DHFR': {
  397. 'database': 'tudataset',
  398. 'reference': '[7]',
  399. 'dataset_size': 467,
  400. 'class_number': 2,
  401. 'task_type': 'classification',
  402. 'ave_node_num': 42.43,
  403. 'ave_edge_num': 44.54,
  404. 'node_labeled': True,
  405. 'edge_labeled': False,
  406. 'node_attr_dim': 3,
  407. 'geometry': '3D, RI',
  408. 'edge_attr_dim': 0,
  409. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR.zip',
  410. 'domain': 'small molecules',
  411. },
  412. 'DHFR_MD': {
  413. 'database': 'tudataset',
  414. 'reference': '[7,23]',
  415. 'dataset_size': 393,
  416. 'class_number': 2,
  417. 'task_type': 'classification',
  418. 'ave_node_num': 23.87,
  419. 'ave_edge_num': 283.01,
  420. 'node_labeled': True,
  421. 'edge_labeled': True,
  422. 'node_attr_dim': 0,
  423. 'geometry': None,
  424. 'edge_attr_dim': 1,
  425. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR_MD.zip',
  426. 'domain': 'small molecules',
  427. },
  428. 'ER_MD': {
  429. 'database': 'tudataset',
  430. 'reference': '[7,23]',
  431. 'dataset_size': 446,
  432. 'class_number': 2,
  433. 'task_type': 'classification',
  434. 'ave_node_num': 21.33,
  435. 'ave_edge_num': 234.85,
  436. 'node_labeled': True,
  437. 'edge_labeled': True,
  438. 'node_attr_dim': 0,
  439. 'geometry': None,
  440. 'edge_attr_dim': 1,
  441. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ER_MD.zip',
  442. 'domain': 'small molecules',
  443. },
  444. 'ethanol': {
  445. 'database': 'tudataset',
  446. 'reference': '[36]',
  447. 'dataset_size': 455093,
  448. 'class_number': None,
  449. 'task_type': 'regression',
  450. 'ave_node_num': 9.0,
  451. 'ave_edge_num': 36.0,
  452. 'node_labeled': True,
  453. 'edge_labeled': False,
  454. 'node_attr_dim': 6,
  455. 'geometry': '3D, RI',
  456. 'edge_attr_dim': 0,
  457. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ethanol.zip',
  458. 'domain': 'small molecules',
  459. },
  460. 'FRANKENSTEIN': {
  461. 'database': 'tudataset',
  462. 'reference': '[15]',
  463. 'dataset_size': 4337,
  464. 'class_number': 2,
  465. 'task_type': 'classification',
  466. 'ave_node_num': 16.9,
  467. 'ave_edge_num': 17.88,
  468. 'node_labeled': False,
  469. 'edge_labeled': False,
  470. 'node_attr_dim': 780,
  471. 'geometry': None,
  472. 'edge_attr_dim': 0,
  473. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FRANKENSTEIN.zip',
  474. 'domain': 'small molecules',
  475. },
  476. 'malonaldehyde': {
  477. 'database': 'tudataset',
  478. 'reference': '[36]',
  479. 'dataset_size': 893238,
  480. 'class_number': None,
  481. 'task_type': 'regression',
  482. 'ave_node_num': 9.0,
  483. 'ave_edge_num': 36.0,
  484. 'node_labeled': True,
  485. 'edge_labeled': False,
  486. 'node_attr_dim': 6,
  487. 'geometry': '3D, RI',
  488. 'edge_attr_dim': 0,
  489. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/malonaldehyde.zip',
  490. 'domain': 'small molecules',
  491. },
  492. 'MCF-7': {
  493. 'database': 'tudataset',
  494. 'reference': '[28]',
  495. 'dataset_size': 27770,
  496. 'class_number': 2,
  497. 'task_type': 'classification',
  498. 'ave_node_num': 26.39,
  499. 'ave_edge_num': 28.52,
  500. 'node_labeled': True,
  501. 'edge_labeled': True,
  502. 'node_attr_dim': 0,
  503. 'geometry': None,
  504. 'edge_attr_dim': 0,
  505. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7.zip',
  506. 'domain': 'small molecules',
  507. },
  508. 'MCF-7H': {
  509. 'database': 'tudataset',
  510. 'reference': '[28]',
  511. 'dataset_size': 27770,
  512. 'class_number': 2,
  513. 'task_type': 'classification',
  514. 'ave_node_num': 47.3,
  515. 'ave_edge_num': 49.43,
  516. 'node_labeled': True,
  517. 'edge_labeled': True,
  518. 'node_attr_dim': 0,
  519. 'geometry': None,
  520. 'edge_attr_dim': 0,
  521. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7H.zip',
  522. 'domain': 'small molecules',
  523. },
  524. 'MOLT-4': {
  525. 'database': 'tudataset',
  526. 'reference': '[28]',
  527. 'dataset_size': 39765,
  528. 'class_number': 2,
  529. 'task_type': 'classification',
  530. 'ave_node_num': 26.09,
  531. 'ave_edge_num': 28.13,
  532. 'node_labeled': True,
  533. 'edge_labeled': True,
  534. 'node_attr_dim': 0,
  535. 'geometry': None,
  536. 'edge_attr_dim': 0,
  537. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4.zip',
  538. 'domain': 'small molecules',
  539. },
  540. 'MOLT-4H': {
  541. 'database': 'tudataset',
  542. 'reference': '[28]',
  543. 'dataset_size': 39765,
  544. 'class_number': 2,
  545. 'task_type': 'classification',
  546. 'ave_node_num': 46.7,
  547. 'ave_edge_num': 48.73,
  548. 'node_labeled': True,
  549. 'edge_labeled': True,
  550. 'node_attr_dim': 0,
  551. 'geometry': None,
  552. 'edge_attr_dim': 0,
  553. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4H.zip',
  554. 'domain': 'small molecules',
  555. },
  556. 'Mutagenicity': {
  557. 'database': 'tudataset',
  558. 'reference': '[16,20]',
  559. 'dataset_size': 4337,
  560. 'class_number': 2,
  561. 'task_type': 'classification',
  562. 'ave_node_num': 30.32,
  563. 'ave_edge_num': 30.77,
  564. 'node_labeled': True,
  565. 'edge_labeled': True,
  566. 'node_attr_dim': 0,
  567. 'geometry': None,
  568. 'edge_attr_dim': 0,
  569. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Mutagenicity.zip',
  570. 'domain': 'small molecules',
  571. },
  572. 'MUTAG': {
  573. 'database': 'tudataset',
  574. 'reference': '[1,23]',
  575. 'dataset_size': 188,
  576. 'class_number': 2,
  577. 'task_type': 'classification',
  578. 'ave_node_num': 17.93,
  579. 'ave_edge_num': 19.79,
  580. 'node_labeled': True,
  581. 'edge_labeled': True,
  582. 'node_attr_dim': 0,
  583. 'geometry': None,
  584. 'edge_attr_dim': 0,
  585. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip',
  586. 'domain': 'small molecules',
  587. },
  588. 'naphthalene': {
  589. 'database': 'tudataset',
  590. 'reference': '[36]',
  591. 'dataset_size': 226256,
  592. 'class_number': None,
  593. 'task_type': 'regression',
  594. 'ave_node_num': 18.0,
  595. 'ave_edge_num': 127.37,
  596. 'node_labeled': True,
  597. 'edge_labeled': False,
  598. 'node_attr_dim': 6,
  599. 'geometry': '3D, RI',
  600. 'edge_attr_dim': 0,
  601. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/naphthalene.zip',
  602. 'domain': 'small molecules',
  603. },
  604. 'NCI1': {
  605. 'database': 'tudataset',
  606. 'reference': '[8,9,22]',
  607. 'dataset_size': 4110,
  608. 'class_number': 2,
  609. 'task_type': 'classification',
  610. 'ave_node_num': 29.87,
  611. 'ave_edge_num': 32.3,
  612. 'node_labeled': True,
  613. 'edge_labeled': False,
  614. 'node_attr_dim': 0,
  615. 'geometry': None,
  616. 'edge_attr_dim': 0,
  617. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI1.zip',
  618. 'domain': 'small molecules',
  619. },
  620. 'NCI109': {
  621. 'database': 'tudataset',
  622. 'reference': '[8,9,22]',
  623. 'dataset_size': 4127,
  624. 'class_number': 2,
  625. 'task_type': 'classification',
  626. 'ave_node_num': 29.68,
  627. 'ave_edge_num': 32.13,
  628. 'node_labeled': True,
  629. 'edge_labeled': False,
  630. 'node_attr_dim': 0,
  631. 'geometry': None,
  632. 'edge_attr_dim': 0,
  633. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI109.zip',
  634. 'domain': 'small molecules',
  635. },
  636. 'NCI-H23': {
  637. 'database': 'tudataset',
  638. 'reference': '[28]',
  639. 'dataset_size': 40353,
  640. 'class_number': 2,
  641. 'task_type': 'classification',
  642. 'ave_node_num': 26.07,
  643. 'ave_edge_num': 28.1,
  644. 'node_labeled': True,
  645. 'edge_labeled': True,
  646. 'node_attr_dim': 0,
  647. 'geometry': None,
  648. 'edge_attr_dim': 0,
  649. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23.zip-H23',
  650. 'domain': 'small molecules',
  651. },
  652. 'NCI-H23H': {
  653. 'database': 'tudataset',
  654. 'reference': '[28]',
  655. 'dataset_size': 40353,
  656. 'class_number': 2,
  657. 'task_type': 'classification',
  658. 'ave_node_num': 46.67,
  659. 'ave_edge_num': 48.69,
  660. 'node_labeled': True,
  661. 'edge_labeled': True,
  662. 'node_attr_dim': 0,
  663. 'geometry': None,
  664. 'edge_attr_dim': 0,
  665. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23H.zip-H23H',
  666. 'domain': 'small molecules',
  667. },
  668. 'OVCAR-8': {
  669. 'database': 'tudataset',
  670. 'reference': '[28]',
  671. 'dataset_size': 40516,
  672. 'class_number': 2,
  673. 'task_type': 'classification',
  674. 'ave_node_num': 26.07,
  675. 'ave_edge_num': 28.1,
  676. 'node_labeled': True,
  677. 'edge_labeled': True,
  678. 'node_attr_dim': 0,
  679. 'geometry': None,
  680. 'edge_attr_dim': 0,
  681. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8.zip-8',
  682. 'domain': 'small molecules',
  683. },
  684. 'OVCAR-8H': {
  685. 'database': 'tudataset',
  686. 'reference': '[28]',
  687. 'dataset_size': 40516,
  688. 'class_number': 2,
  689. 'task_type': 'classification',
  690. 'ave_node_num': 46.67,
  691. 'ave_edge_num': 48.7,
  692. 'node_labeled': True,
  693. 'edge_labeled': True,
  694. 'node_attr_dim': 0,
  695. 'geometry': None,
  696. 'edge_attr_dim': 0,
  697. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8H.zip-8H',
  698. 'domain': 'small molecules',
  699. },
  700. 'P388': {
  701. 'database': 'tudataset',
  702. 'reference': '[28]',
  703. 'dataset_size': 41472,
  704. 'class_number': 2,
  705. 'task_type': 'classification',
  706. 'ave_node_num': 22.11,
  707. 'ave_edge_num': 23.55,
  708. 'node_labeled': True,
  709. 'edge_labeled': True,
  710. 'node_attr_dim': 0,
  711. 'geometry': None,
  712. 'edge_attr_dim': 0,
  713. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388.zip',
  714. 'domain': 'small molecules',
  715. },
  716. 'P388H': {
  717. 'database': 'tudataset',
  718. 'reference': '[28]',
  719. 'dataset_size': 41472,
  720. 'class_number': 2,
  721. 'task_type': 'classification',
  722. 'ave_node_num': 40.44,
  723. 'ave_edge_num': 41.88,
  724. 'node_labeled': True,
  725. 'edge_labeled': True,
  726. 'node_attr_dim': 0,
  727. 'geometry': None,
  728. 'edge_attr_dim': 0,
  729. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388H.zip',
  730. 'domain': 'small molecules',
  731. },
  732. 'PC-3': {
  733. 'database': 'tudataset',
  734. 'reference': '[28]',
  735. 'dataset_size': 27509,
  736. 'class_number': 2,
  737. 'task_type': 'classification',
  738. 'ave_node_num': 26.35,
  739. 'ave_edge_num': 28.49,
  740. 'node_labeled': True,
  741. 'edge_labeled': True,
  742. 'node_attr_dim': 0,
  743. 'geometry': None,
  744. 'edge_attr_dim': 0,
  745. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3.zip',
  746. 'domain': 'small molecules',
  747. },
  748. 'PC-3H': {
  749. 'database': 'tudataset',
  750. 'reference': '[28]',
  751. 'dataset_size': 27509,
  752. 'class_number': 2,
  753. 'task_type': 'classification',
  754. 'ave_node_num': 47.19,
  755. 'ave_edge_num': 49.32,
  756. 'node_labeled': True,
  757. 'edge_labeled': True,
  758. 'node_attr_dim': 0,
  759. 'geometry': None,
  760. 'edge_attr_dim': 0,
  761. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3H.zip',
  762. 'domain': 'small molecules',
  763. },
  764. 'PTC_FM': {
  765. 'database': 'tudataset',
  766. 'reference': '[2,23]',
  767. 'dataset_size': 349,
  768. 'class_number': 2,
  769. 'task_type': 'classification',
  770. 'ave_node_num': 14.11,
  771. 'ave_edge_num': 14.48,
  772. 'node_labeled': True,
  773. 'edge_labeled': True,
  774. 'node_attr_dim': 0,
  775. 'geometry': None,
  776. 'edge_attr_dim': 0,
  777. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FM.zip',
  778. 'domain': 'small molecules',
  779. },
  780. 'PTC_FR': {
  781. 'database': 'tudataset',
  782. 'reference': '[2,23]',
  783. 'dataset_size': 351,
  784. 'class_number': 2,
  785. 'task_type': 'classification',
  786. 'ave_node_num': 14.56,
  787. 'ave_edge_num': 15.0,
  788. 'node_labeled': True,
  789. 'edge_labeled': True,
  790. 'node_attr_dim': 0,
  791. 'geometry': None,
  792. 'edge_attr_dim': 0,
  793. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FR.zip',
  794. 'domain': 'small molecules',
  795. },
  796. 'PTC_MM': {
  797. 'database': 'tudataset',
  798. 'reference': '[2,23]',
  799. 'dataset_size': 336,
  800. 'class_number': 2,
  801. 'task_type': 'classification',
  802. 'ave_node_num': 13.97,
  803. 'ave_edge_num': 14.32,
  804. 'node_labeled': True,
  805. 'edge_labeled': True,
  806. 'node_attr_dim': 0,
  807. 'geometry': None,
  808. 'edge_attr_dim': 0,
  809. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MM.zip',
  810. 'domain': 'small molecules',
  811. },
  812. 'PTC_MR': {
  813. 'database': 'tudataset',
  814. 'reference': '[2,23]',
  815. 'dataset_size': 344,
  816. 'class_number': 2,
  817. 'task_type': 'classification',
  818. 'ave_node_num': 14.29,
  819. 'ave_edge_num': 14.69,
  820. 'node_labeled': True,
  821. 'edge_labeled': True,
  822. 'node_attr_dim': 0,
  823. 'geometry': None,
  824. 'edge_attr_dim': 0,
  825. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MR.zip',
  826. 'domain': 'small molecules',
  827. },
  828. 'QM9': {
  829. 'database': 'tudataset',
  830. 'reference': '[33,34,35]',
  831. 'dataset_size': 129433,
  832. 'class_number': None,
  833. 'task_type': 'regression',
  834. 'ave_node_num': 18.03,
  835. 'ave_edge_num': 18.63,
  836. 'node_labeled': False,
  837. 'edge_labeled': False,
  838. 'node_attr_dim': 16,
  839. 'geometry': '3D, RI',
  840. 'edge_attr_dim': 4,
  841. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/QM9.zip',
  842. 'domain': 'small molecules',
  843. },
  844. 'salicylic_acid': {
  845. 'database': 'tudataset',
  846. 'reference': '[36]',
  847. 'dataset_size': 220232,
  848. 'class_number': None,
  849. 'task_type': 'regression',
  850. 'ave_node_num': 16.0,
  851. 'ave_edge_num': 104.13,
  852. 'node_labeled': True,
  853. 'edge_labeled': False,
  854. 'node_attr_dim': 6,
  855. 'geometry': '3D, RI',
  856. 'edge_attr_dim': 0,
  857. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/salicylic_acid.zip',
  858. 'domain': 'small molecules',
  859. },
  860. 'SF-295': {
  861. 'database': 'tudataset',
  862. 'reference': '[28]',
  863. 'dataset_size': 40271,
  864. 'class_number': 2,
  865. 'task_type': 'classification',
  866. 'ave_node_num': 26.06,
  867. 'ave_edge_num': 28.08,
  868. 'node_labeled': True,
  869. 'edge_labeled': True,
  870. 'node_attr_dim': 0,
  871. 'geometry': None,
  872. 'edge_attr_dim': 0,
  873. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295.zip',
  874. 'domain': 'small molecules',
  875. },
  876. 'SF-295H': {
  877. 'database': 'tudataset',
  878. 'reference': '[28]',
  879. 'dataset_size': 40271,
  880. 'class_number': 2,
  881. 'task_type': 'classification',
  882. 'ave_node_num': 46.65,
  883. 'ave_edge_num': 48.68,
  884. 'node_labeled': True,
  885. 'edge_labeled': True,
  886. 'node_attr_dim': 0,
  887. 'geometry': None,
  888. 'edge_attr_dim': 0,
  889. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295H.zip',
  890. 'domain': 'small molecules',
  891. },
  892. 'SN12C': {
  893. 'database': 'tudataset',
  894. 'reference': '[28]',
  895. 'dataset_size': 40004,
  896. 'class_number': 2,
  897. 'task_type': 'classification',
  898. 'ave_node_num': 26.08,
  899. 'ave_edge_num': 28.11,
  900. 'node_labeled': True,
  901. 'edge_labeled': True,
  902. 'node_attr_dim': 0,
  903. 'geometry': None,
  904. 'edge_attr_dim': 0,
  905. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12C.zip',
  906. 'domain': 'small molecules',
  907. },
  908. 'SN12CH': {
  909. 'database': 'tudataset',
  910. 'reference': '[28]',
  911. 'dataset_size': 40004,
  912. 'class_number': 2,
  913. 'task_type': 'classification',
  914. 'ave_node_num': 46.69,
  915. 'ave_edge_num': 48.71,
  916. 'node_labeled': True,
  917. 'edge_labeled': True,
  918. 'node_attr_dim': 0,
  919. 'geometry': None,
  920. 'edge_attr_dim': 0,
  921. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12CH.zip',
  922. 'domain': 'small molecules',
  923. },
  924. 'SW-620': {
  925. 'database': 'tudataset',
  926. 'reference': '[28]',
  927. 'dataset_size': 40532,
  928. 'class_number': 2,
  929. 'task_type': 'classification',
  930. 'ave_node_num': 26.05,
  931. 'ave_edge_num': 28.08,
  932. 'node_labeled': True,
  933. 'edge_labeled': True,
  934. 'node_attr_dim': 0,
  935. 'geometry': None,
  936. 'edge_attr_dim': 0,
  937. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620.zip',
  938. 'domain': 'small molecules',
  939. },
  940. 'SW-620H': {
  941. 'database': 'tudataset',
  942. 'reference': '[28]',
  943. 'dataset_size': 40532,
  944. 'class_number': 2,
  945. 'task_type': 'classification',
  946. 'ave_node_num': 46.62,
  947. 'ave_edge_num': 48.65,
  948. 'node_labeled': True,
  949. 'edge_labeled': True,
  950. 'node_attr_dim': 0,
  951. 'geometry': None,
  952. 'edge_attr_dim': 0,
  953. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620H.zip',
  954. 'domain': 'small molecules',
  955. },
  956. 'toluene': {
  957. 'database': 'tudataset',
  958. 'reference': '[36]',
  959. 'dataset_size': 342791,
  960. 'class_number': None,
  961. 'task_type': 'regression',
  962. 'ave_node_num': 15.0,
  963. 'ave_edge_num': 96.15,
  964. 'node_labeled': True,
  965. 'edge_labeled': False,
  966. 'node_attr_dim': 6,
  967. 'geometry': '3D, RI',
  968. 'edge_attr_dim': 0,
  969. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/toluene.zip',
  970. 'domain': 'small molecules',
  971. },
  972. 'Tox21_AhR_training': {
  973. 'database': 'tudataset',
  974. 'reference': '[24]',
  975. 'dataset_size': 8169,
  976. 'class_number': 2,
  977. 'task_type': 'classification',
  978. 'ave_node_num': 18.09,
  979. 'ave_edge_num': 18.5,
  980. 'node_labeled': True,
  981. 'edge_labeled': True,
  982. 'node_attr_dim': 0,
  983. 'geometry': None,
  984. 'edge_attr_dim': 0,
  985. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_training.zip',
  986. 'domain': 'small molecules',
  987. },
  988. 'Tox21_AhR_testing': {
  989. 'database': 'tudataset',
  990. 'reference': '[24]',
  991. 'dataset_size': 272,
  992. 'class_number': 2,
  993. 'task_type': 'classification',
  994. 'ave_node_num': 22.13,
  995. 'ave_edge_num': 23.05,
  996. 'node_labeled': True,
  997. 'edge_labeled': True,
  998. 'node_attr_dim': 0,
  999. 'geometry': None,
  1000. 'edge_attr_dim': 0,
  1001. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_testing.zip',
  1002. 'domain': 'small molecules',
  1003. },
  1004. 'Tox21_AhR_evaluation': {
  1005. 'database': 'tudataset',
  1006. 'reference': '[24]',
  1007. 'dataset_size': 607,
  1008. 'class_number': 2,
  1009. 'task_type': 'classification',
  1010. 'ave_node_num': 17.64,
  1011. 'ave_edge_num': 18.06,
  1012. 'node_labeled': True,
  1013. 'edge_labeled': True,
  1014. 'node_attr_dim': 0,
  1015. 'geometry': None,
  1016. 'edge_attr_dim': 0,
  1017. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_evaluation.zip',
  1018. 'domain': 'small molecules',
  1019. },
  1020. 'Tox21_AR_training': {
  1021. 'database': 'tudataset',
  1022. 'reference': '[24]',
  1023. 'dataset_size': 9362,
  1024. 'class_number': 2,
  1025. 'task_type': 'classification',
  1026. 'ave_node_num': 18.39,
  1027. 'ave_edge_num': 18.84,
  1028. 'node_labeled': True,
  1029. 'edge_labeled': True,
  1030. 'node_attr_dim': 0,
  1031. 'geometry': None,
  1032. 'edge_attr_dim': 0,
  1033. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_training.zip',
  1034. 'domain': 'small molecules',
  1035. },
  1036. 'Tox21_AR_testing': {
  1037. 'database': 'tudataset',
  1038. 'reference': '[24]',
  1039. 'dataset_size': 292,
  1040. 'class_number': 2,
  1041. 'task_type': 'classification',
  1042. 'ave_node_num': 22.35,
  1043. 'ave_edge_num': 23.32,
  1044. 'node_labeled': True,
  1045. 'edge_labeled': True,
  1046. 'node_attr_dim': 0,
  1047. 'geometry': None,
  1048. 'edge_attr_dim': 0,
  1049. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_testing.zip',
  1050. 'domain': 'small molecules',
  1051. },
  1052. 'Tox21_AR_evaluation': {
  1053. 'database': 'tudataset',
  1054. 'reference': '[24]',
  1055. 'dataset_size': 585,
  1056. 'class_number': 2,
  1057. 'task_type': 'classification',
  1058. 'ave_node_num': 17.99,
  1059. 'ave_edge_num': 18.45,
  1060. 'node_labeled': True,
  1061. 'edge_labeled': True,
  1062. 'node_attr_dim': 0,
  1063. 'geometry': None,
  1064. 'edge_attr_dim': 0,
  1065. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_evaluation.zip',
  1066. 'domain': 'small molecules',
  1067. },
  1068. 'Tox21_AR-LBD_training': {
  1069. 'database': 'tudataset',
  1070. 'reference': '[24]',
  1071. 'dataset_size': 8599,
  1072. 'class_number': 2,
  1073. 'task_type': 'classification',
  1074. 'ave_node_num': 17.77,
  1075. 'ave_edge_num': 18.16,
  1076. 'node_labeled': True,
  1077. 'edge_labeled': True,
  1078. 'node_attr_dim': 0,
  1079. 'geometry': None,
  1080. 'edge_attr_dim': 0,
  1081. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_training.zip',
  1082. 'domain': 'small molecules',
  1083. },
  1084. 'Tox21_AR-LBD_testing': {
  1085. 'database': 'tudataset',
  1086. 'reference': '[24]',
  1087. 'dataset_size': 253,
  1088. 'class_number': 2,
  1089. 'task_type': 'classification',
  1090. 'ave_node_num': 21.85,
  1091. 'ave_edge_num': 22.73,
  1092. 'node_labeled': True,
  1093. 'edge_labeled': True,
  1094. 'node_attr_dim': 0,
  1095. 'geometry': None,
  1096. 'edge_attr_dim': 0,
  1097. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_testing.zip',
  1098. 'domain': 'small molecules',
  1099. },
  1100. 'Tox21_AR-LBD_evaluation': {
  1101. 'database': 'tudataset',
  1102. 'reference': '[24]',
  1103. 'dataset_size': 580,
  1104. 'class_number': 2,
  1105. 'task_type': 'classification',
  1106. 'ave_node_num': 17.09,
  1107. 'ave_edge_num': 17.42,
  1108. 'node_labeled': True,
  1109. 'edge_labeled': True,
  1110. 'node_attr_dim': 0,
  1111. 'geometry': None,
  1112. 'edge_attr_dim': 0,
  1113. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_evaluation.zip',
  1114. 'domain': 'small molecules',
  1115. },
  1116. 'Tox21_ARE_training': {
  1117. 'database': 'tudataset',
  1118. 'reference': '[24]',
  1119. 'dataset_size': 7167,
  1120. 'class_number': 2,
  1121. 'task_type': 'classification',
  1122. 'ave_node_num': 16.28,
  1123. 'ave_edge_num': 16.52,
  1124. 'node_labeled': True,
  1125. 'edge_labeled': True,
  1126. 'node_attr_dim': 0,
  1127. 'geometry': None,
  1128. 'edge_attr_dim': 0,
  1129. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_training.zip',
  1130. 'domain': 'small molecules',
  1131. },
  1132. 'Tox21_ARE_testing': {
  1133. 'database': 'tudataset',
  1134. 'reference': '[24]',
  1135. 'dataset_size': 234,
  1136. 'class_number': 2,
  1137. 'task_type': 'classification',
  1138. 'ave_node_num': 21.99,
  1139. 'ave_edge_num': 22.91,
  1140. 'node_labeled': True,
  1141. 'edge_labeled': True,
  1142. 'node_attr_dim': 0,
  1143. 'geometry': None,
  1144. 'edge_attr_dim': 0,
  1145. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_testing.zip',
  1146. 'domain': 'small molecules',
  1147. },
  1148. 'Tox21_ARE_evaluation': {
  1149. 'database': 'tudataset',
  1150. 'reference': '[24]',
  1151. 'dataset_size': 552,
  1152. 'class_number': 2,
  1153. 'task_type': 'classification',
  1154. 'ave_node_num': 17.01,
  1155. 'ave_edge_num': 17.33,
  1156. 'node_labeled': True,
  1157. 'edge_labeled': True,
  1158. 'node_attr_dim': 0,
  1159. 'geometry': None,
  1160. 'edge_attr_dim': 0,
  1161. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_evaluation.zip',
  1162. 'domain': 'small molecules',
  1163. },
  1164. 'Tox21_aromatase_training': {
  1165. 'database': 'tudataset',
  1166. 'reference': '[24]',
  1167. 'dataset_size': 7226,
  1168. 'class_number': 2,
  1169. 'task_type': 'classification',
  1170. 'ave_node_num': 17.5,
  1171. 'ave_edge_num': 17.79,
  1172. 'node_labeled': True,
  1173. 'edge_labeled': True,
  1174. 'node_attr_dim': 0,
  1175. 'geometry': None,
  1176. 'edge_attr_dim': 0,
  1177. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_training.zip',
  1178. 'domain': 'small molecules',
  1179. },
  1180. 'Tox21_aromatase_testing': {
  1181. 'database': 'tudataset',
  1182. 'reference': '[24]',
  1183. 'dataset_size': 214,
  1184. 'class_number': 2,
  1185. 'task_type': 'classification',
  1186. 'ave_node_num': 21.65,
  1187. 'ave_edge_num': 22.36,
  1188. 'node_labeled': True,
  1189. 'edge_labeled': True,
  1190. 'node_attr_dim': 0,
  1191. 'geometry': None,
  1192. 'edge_attr_dim': 0,
  1193. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_testing.zip',
  1194. 'domain': 'small molecules',
  1195. },
  1196. 'Tox21_aromatase_evaluation': {
  1197. 'database': 'tudataset',
  1198. 'reference': '[24]',
  1199. 'dataset_size': 528,
  1200. 'class_number': 2,
  1201. 'task_type': 'classification',
  1202. 'ave_node_num': 16.74,
  1203. 'ave_edge_num': 16.99,
  1204. 'node_labeled': True,
  1205. 'edge_labeled': True,
  1206. 'node_attr_dim': 0,
  1207. 'geometry': None,
  1208. 'edge_attr_dim': 0,
  1209. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_evaluation.zip',
  1210. 'domain': 'small molecules',
  1211. },
  1212. 'Tox21_ATAD5_training': {
  1213. 'database': 'tudataset',
  1214. 'reference': '[24]',
  1215. 'dataset_size': 9091,
  1216. 'class_number': 2,
  1217. 'task_type': 'classification',
  1218. 'ave_node_num': 17.89,
  1219. 'ave_edge_num': 18.3,
  1220. 'node_labeled': True,
  1221. 'edge_labeled': True,
  1222. 'node_attr_dim': 0,
  1223. 'geometry': None,
  1224. 'edge_attr_dim': 0,
  1225. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_training.zip',
  1226. 'domain': 'small molecules',
  1227. },
  1228. 'Tox21_ATAD5_testing': {
  1229. 'database': 'tudataset',
  1230. 'reference': '[24]',
  1231. 'dataset_size': 272,
  1232. 'class_number': 2,
  1233. 'task_type': 'classification',
  1234. 'ave_node_num': 21.99,
  1235. 'ave_edge_num': 22.89,
  1236. 'node_labeled': True,
  1237. 'edge_labeled': True,
  1238. 'node_attr_dim': 0,
  1239. 'geometry': None,
  1240. 'edge_attr_dim': 0,
  1241. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_testing.zip',
  1242. 'domain': 'small molecules',
  1243. },
  1244. 'Tox21_ATAD5_evaluation': {
  1245. 'database': 'tudataset',
  1246. 'reference': '[24]',
  1247. 'dataset_size': 619,
  1248. 'class_number': 2,
  1249. 'task_type': 'classification',
  1250. 'ave_node_num': 17.68,
  1251. 'ave_edge_num': 18.11,
  1252. 'node_labeled': True,
  1253. 'edge_labeled': True,
  1254. 'node_attr_dim': 0,
  1255. 'geometry': None,
  1256. 'edge_attr_dim': 0,
  1257. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_evaluation.zip',
  1258. 'domain': 'small molecules',
  1259. },
  1260. 'Tox21_ER_training': {
  1261. 'database': 'tudataset',
  1262. 'reference': '[24]',
  1263. 'dataset_size': 7697,
  1264. 'class_number': 2,
  1265. 'task_type': 'classification',
  1266. 'ave_node_num': 17.58,
  1267. 'ave_edge_num': 17.94,
  1268. 'node_labeled': True,
  1269. 'edge_labeled': True,
  1270. 'node_attr_dim': 0,
  1271. 'geometry': None,
  1272. 'edge_attr_dim': 0,
  1273. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_training.zip',
  1274. 'domain': 'small molecules',
  1275. },
  1276. 'Tox21_ER_testing': {
  1277. 'database': 'tudataset',
  1278. 'reference': '[24]',
  1279. 'dataset_size': 265,
  1280. 'class_number': 2,
  1281. 'task_type': 'classification',
  1282. 'ave_node_num': 22.16,
  1283. 'ave_edge_num': 23.13,
  1284. 'node_labeled': True,
  1285. 'edge_labeled': True,
  1286. 'node_attr_dim': 0,
  1287. 'geometry': None,
  1288. 'edge_attr_dim': 0,
  1289. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_testing.zip',
  1290. 'domain': 'small molecules',
  1291. },
  1292. 'Tox21_ER_evaluation': {
  1293. 'database': 'tudataset',
  1294. 'reference': '[24]',
  1295. 'dataset_size': 515,
  1296. 'class_number': 2,
  1297. 'task_type': 'classification',
  1298. 'ave_node_num': 17.66,
  1299. 'ave_edge_num': 18.1,
  1300. 'node_labeled': True,
  1301. 'edge_labeled': True,
  1302. 'node_attr_dim': 0,
  1303. 'geometry': None,
  1304. 'edge_attr_dim': 0,
  1305. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_evaluation.zip',
  1306. 'domain': 'small molecules',
  1307. },
  1308. 'Tox21_ER-LBD_training': {
  1309. 'database': 'tudataset',
  1310. 'reference': '[24]',
  1311. 'dataset_size': 8753,
  1312. 'class_number': 2,
  1313. 'task_type': 'classification',
  1314. 'ave_node_num': 18.06,
  1315. 'ave_edge_num': 18.47,
  1316. 'node_labeled': True,
  1317. 'edge_labeled': True,
  1318. 'node_attr_dim': 0,
  1319. 'geometry': None,
  1320. 'edge_attr_dim': 0,
  1321. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_training.zip',
  1322. 'domain': 'small molecules',
  1323. },
  1324. 'Tox21_ER-LBD_testing': {
  1325. 'database': 'tudataset',
  1326. 'reference': '[24]',
  1327. 'dataset_size': 287,
  1328. 'class_number': 2,
  1329. 'task_type': 'classification',
  1330. 'ave_node_num': 22.28,
  1331. 'ave_edge_num': 23.23,
  1332. 'node_labeled': True,
  1333. 'edge_labeled': True,
  1334. 'node_attr_dim': 0,
  1335. 'geometry': None,
  1336. 'edge_attr_dim': 0,
  1337. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_testing.zip',
  1338. 'domain': 'small molecules',
  1339. },
  1340. 'Tox21_ER-LBD_evaluation': {
  1341. 'database': 'tudataset',
  1342. 'reference': '[24]',
  1343. 'dataset_size': 599,
  1344. 'class_number': 2,
  1345. 'task_type': 'classification',
  1346. 'ave_node_num': 17.75,
  1347. 'ave_edge_num': 18.17,
  1348. 'node_labeled': True,
  1349. 'edge_labeled': True,
  1350. 'node_attr_dim': 0,
  1351. 'geometry': None,
  1352. 'edge_attr_dim': 0,
  1353. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_evaluation.zip',
  1354. 'domain': 'small molecules',
  1355. },
  1356. 'Tox21_HSE_training': {
  1357. 'database': 'tudataset',
  1358. 'reference': '[24]',
  1359. 'dataset_size': 8150,
  1360. 'class_number': 2,
  1361. 'task_type': 'classification',
  1362. 'ave_node_num': 16.72,
  1363. 'ave_edge_num': 17.04,
  1364. 'node_labeled': True,
  1365. 'edge_labeled': True,
  1366. 'node_attr_dim': 0,
  1367. 'geometry': None,
  1368. 'edge_attr_dim': 0,
  1369. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_training.zip',
  1370. 'domain': 'small molecules',
  1371. },
  1372. 'Tox21_HSE_testing': {
  1373. 'database': 'tudataset',
  1374. 'reference': '[24]',
  1375. 'dataset_size': 267,
  1376. 'class_number': 2,
  1377. 'task_type': 'classification',
  1378. 'ave_node_num': 22.07,
  1379. 'ave_edge_num': 23.0,
  1380. 'node_labeled': True,
  1381. 'edge_labeled': True,
  1382. 'node_attr_dim': 0,
  1383. 'geometry': None,
  1384. 'edge_attr_dim': 0,
  1385. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_testing.zip',
  1386. 'domain': 'small molecules',
  1387. },
  1388. 'Tox21_HSE_evaluation': {
  1389. 'database': 'tudataset',
  1390. 'reference': '[24]',
  1391. 'dataset_size': 607,
  1392. 'class_number': 2,
  1393. 'task_type': 'classification',
  1394. 'ave_node_num': 17.61,
  1395. 'ave_edge_num': 18.01,
  1396. 'node_labeled': True,
  1397. 'edge_labeled': True,
  1398. 'node_attr_dim': 0,
  1399. 'geometry': None,
  1400. 'edge_attr_dim': 0,
  1401. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_evaluation.zip',
  1402. 'domain': 'small molecules',
  1403. },
  1404. 'Tox21_MMP_training': {
  1405. 'database': 'tudataset',
  1406. 'reference': '[24]',
  1407. 'dataset_size': 7320,
  1408. 'class_number': 2,
  1409. 'task_type': 'classification',
  1410. 'ave_node_num': 17.49,
  1411. 'ave_edge_num': 17.83,
  1412. 'node_labeled': True,
  1413. 'edge_labeled': True,
  1414. 'node_attr_dim': 0,
  1415. 'geometry': None,
  1416. 'edge_attr_dim': 0,
  1417. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_training.zip',
  1418. 'domain': 'small molecules',
  1419. },
  1420. 'Tox21_MMP_testing': {
  1421. 'database': 'tudataset',
  1422. 'reference': '[24]',
  1423. 'dataset_size': 238,
  1424. 'class_number': 2,
  1425. 'task_type': 'classification',
  1426. 'ave_node_num': 21.68,
  1427. 'ave_edge_num': 22.55,
  1428. 'node_labeled': True,
  1429. 'edge_labeled': True,
  1430. 'node_attr_dim': 0,
  1431. 'geometry': None,
  1432. 'edge_attr_dim': 0,
  1433. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_testing.zip',
  1434. 'domain': 'small molecules',
  1435. },
  1436. 'Tox21_MMP_evaluation': {
  1437. 'database': 'tudataset',
  1438. 'reference': '[24]',
  1439. 'dataset_size': 541,
  1440. 'class_number': 2,
  1441. 'task_type': 'classification',
  1442. 'ave_node_num': 16.67,
  1443. 'ave_edge_num': 16.88,
  1444. 'node_labeled': True,
  1445. 'edge_labeled': True,
  1446. 'node_attr_dim': 0,
  1447. 'geometry': None,
  1448. 'edge_attr_dim': 0,
  1449. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_evaluation.zip',
  1450. 'domain': 'small molecules',
  1451. },
  1452. 'Tox21_p53_training': {
  1453. 'database': 'tudataset',
  1454. 'reference': '[24]',
  1455. 'dataset_size': 8634,
  1456. 'class_number': 2,
  1457. 'task_type': 'classification',
  1458. 'ave_node_num': 17.79,
  1459. 'ave_edge_num': 18.19,
  1460. 'node_labeled': True,
  1461. 'edge_labeled': True,
  1462. 'node_attr_dim': 0,
  1463. 'geometry': None,
  1464. 'edge_attr_dim': 0,
  1465. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_training.zip',
  1466. 'domain': 'small molecules',
  1467. },
  1468. 'Tox21_p53_testing': {
  1469. 'database': 'tudataset',
  1470. 'reference': '[24]',
  1471. 'dataset_size': 269,
  1472. 'class_number': 2,
  1473. 'task_type': 'classification',
  1474. 'ave_node_num': 22.14,
  1475. 'ave_edge_num': 23.04,
  1476. 'node_labeled': True,
  1477. 'edge_labeled': True,
  1478. 'node_attr_dim': 0,
  1479. 'geometry': None,
  1480. 'edge_attr_dim': 0,
  1481. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_testing.zip',
  1482. 'domain': 'small molecules',
  1483. },
  1484. 'Tox21_p53_evaluation': {
  1485. 'database': 'tudataset',
  1486. 'reference': '[24]',
  1487. 'dataset_size': 613,
  1488. 'class_number': 2,
  1489. 'task_type': 'classification',
  1490. 'ave_node_num': 17.34,
  1491. 'ave_edge_num': 17.72,
  1492. 'node_labeled': True,
  1493. 'edge_labeled': True,
  1494. 'node_attr_dim': 0,
  1495. 'geometry': None,
  1496. 'edge_attr_dim': 0,
  1497. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_evaluation.zip',
  1498. 'domain': 'small molecules',
  1499. },
  1500. 'Tox21_PPAR-gamma_training': {
  1501. 'database': 'tudataset',
  1502. 'reference': '[24]',
  1503. 'dataset_size': 8184,
  1504. 'class_number': 2,
  1505. 'task_type': 'classification',
  1506. 'ave_node_num': 17.23,
  1507. 'ave_edge_num': 17.55,
  1508. 'node_labeled': True,
  1509. 'edge_labeled': True,
  1510. 'node_attr_dim': 0,
  1511. 'geometry': None,
  1512. 'edge_attr_dim': 0,
  1513. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_training.zip',
  1514. 'domain': 'small molecules',
  1515. },
  1516. 'Tox21_PPAR-gamma_testing': {
  1517. 'database': 'tudataset',
  1518. 'reference': '[24]',
  1519. 'dataset_size': 267,
  1520. 'class_number': 2,
  1521. 'task_type': 'classification',
  1522. 'ave_node_num': 22.04,
  1523. 'ave_edge_num': 22.93,
  1524. 'node_labeled': True,
  1525. 'edge_labeled': True,
  1526. 'node_attr_dim': 0,
  1527. 'geometry': None,
  1528. 'edge_attr_dim': 0,
  1529. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_testing.zip',
  1530. 'domain': 'small molecules',
  1531. },
  1532. 'Tox21_PPAR-gamma_evaluation': {
  1533. 'database': 'tudataset',
  1534. 'reference': '[24]',
  1535. 'dataset_size': 602,
  1536. 'class_number': 2,
  1537. 'task_type': 'classification',
  1538. 'ave_node_num': 17.38,
  1539. 'ave_edge_num': 17.77,
  1540. 'node_labeled': True,
  1541. 'edge_labeled': True,
  1542. 'node_attr_dim': 0,
  1543. 'geometry': None,
  1544. 'edge_attr_dim': 0,
  1545. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_evaluation.zip',
  1546. 'domain': 'small molecules',
  1547. },
  1548. 'UACC257': {
  1549. 'database': 'tudataset',
  1550. 'reference': '[28]',
  1551. 'dataset_size': 39988,
  1552. 'class_number': 2,
  1553. 'task_type': 'classification',
  1554. 'ave_node_num': 26.09,
  1555. 'ave_edge_num': 28.12,
  1556. 'node_labeled': True,
  1557. 'edge_labeled': True,
  1558. 'node_attr_dim': 0,
  1559. 'geometry': None,
  1560. 'edge_attr_dim': 0,
  1561. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257.zip',
  1562. 'domain': 'small molecules',
  1563. },
  1564. 'UACC257H': {
  1565. 'database': 'tudataset',
  1566. 'reference': '[28]',
  1567. 'dataset_size': 39988,
  1568. 'class_number': 2,
  1569. 'task_type': 'classification',
  1570. 'ave_node_num': 46.68,
  1571. 'ave_edge_num': 48.71,
  1572. 'node_labeled': True,
  1573. 'edge_labeled': True,
  1574. 'node_attr_dim': 0,
  1575. 'geometry': None,
  1576. 'edge_attr_dim': 0,
  1577. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257H.zip',
  1578. 'domain': 'small molecules',
  1579. },
  1580. 'uracil': {
  1581. 'database': 'tudataset',
  1582. 'reference': '[36]',
  1583. 'dataset_size': 133770,
  1584. 'class_number': None,
  1585. 'task_type': 'regression',
  1586. 'ave_node_num': 12.0,
  1587. 'ave_edge_num': 64.44,
  1588. 'node_labeled': True,
  1589. 'edge_labeled': False,
  1590. 'node_attr_dim': 6,
  1591. 'geometry': '3D, RI',
  1592. 'edge_attr_dim': 0,
  1593. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/uracil.zip',
  1594. 'domain': 'small molecules',
  1595. },
  1596. 'Yeast': {
  1597. 'database': 'tudataset',
  1598. 'reference': '[28]',
  1599. 'dataset_size': 79601,
  1600. 'class_number': 2,
  1601. 'task_type': 'classification',
  1602. 'ave_node_num': 21.54,
  1603. 'ave_edge_num': 22.84,
  1604. 'node_labeled': True,
  1605. 'edge_labeled': True,
  1606. 'node_attr_dim': 0,
  1607. 'geometry': None,
  1608. 'edge_attr_dim': 0,
  1609. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Yeast.zip',
  1610. 'domain': 'small molecules',
  1611. },
  1612. 'YeastH': {
  1613. 'database': 'tudataset',
  1614. 'reference': '[28]',
  1615. 'dataset_size': 79601,
  1616. 'class_number': 2,
  1617. 'task_type': 'classification',
  1618. 'ave_node_num': 39.44,
  1619. 'ave_edge_num': 40.74,
  1620. 'node_labeled': True,
  1621. 'edge_labeled': True,
  1622. 'node_attr_dim': 0,
  1623. 'geometry': None,
  1624. 'edge_attr_dim': 0,
  1625. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/YeastH.zip',
  1626. 'domain': 'small molecules',
  1627. },
  1628. 'ZINC_full': {
  1629. 'database': 'tudataset',
  1630. 'reference': '[31]',
  1631. 'dataset_size': 249456,
  1632. 'class_number': None,
  1633. 'task_type': 'regression',
  1634. 'ave_node_num': 23.14,
  1635. 'ave_edge_num': 24.91,
  1636. 'node_labeled': True,
  1637. 'edge_labeled': True,
  1638. 'node_attr_dim': 0,
  1639. 'geometry': None,
  1640. 'edge_attr_dim': 0,
  1641. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_full.zip',
  1642. 'domain': 'small molecules',
  1643. },
  1644. 'ZINC_test': {
  1645. 'database': 'tudataset',
  1646. 'reference': '[31]',
  1647. 'dataset_size': 5000,
  1648. 'class_number': None,
  1649. 'task_type': 'regression',
  1650. 'ave_node_num': 23.1,
  1651. 'ave_edge_num': 24.83,
  1652. 'node_labeled': True,
  1653. 'edge_labeled': True,
  1654. 'node_attr_dim': 0,
  1655. 'geometry': None,
  1656. 'edge_attr_dim': 0,
  1657. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_test.zip',
  1658. 'domain': 'small molecules',
  1659. },
  1660. 'ZINC_train': {
  1661. 'database': 'tudataset',
  1662. 'reference': '[31]',
  1663. 'dataset_size': 220011,
  1664. 'class_number': None,
  1665. 'task_type': 'regression',
  1666. 'ave_node_num': 23.15,
  1667. 'ave_edge_num': 24.91,
  1668. 'node_labeled': True,
  1669. 'edge_labeled': True,
  1670. 'node_attr_dim': 0,
  1671. 'geometry': None,
  1672. 'edge_attr_dim': 0,
  1673. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_train.zip',
  1674. 'domain': 'small molecules',
  1675. },
  1676. 'ZINC_val': {
  1677. 'database': 'tudataset',
  1678. 'reference': '[31]',
  1679. 'dataset_size': 24445,
  1680. 'class_number': None,
  1681. 'task_type': 'regression',
  1682. 'ave_node_num': 23.13,
  1683. 'ave_edge_num': 24.88,
  1684. 'node_labeled': True,
  1685. 'edge_labeled': True,
  1686. 'node_attr_dim': 0,
  1687. 'geometry': None,
  1688. 'edge_attr_dim': 0,
  1689. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_val.zip',
  1690. 'domain': 'small molecules',
  1691. },
  1692. ### bioinformatics
  1693. 'DD': {
  1694. 'database': 'tudataset',
  1695. 'reference': '[6,22]',
  1696. 'dataset_size': 1178,
  1697. 'class_number': 2,
  1698. 'task_type': 'classification',
  1699. 'ave_node_num': 284.32,
  1700. 'ave_edge_num': 715.66,
  1701. 'node_labeled': True,
  1702. 'edge_labeled': False,
  1703. 'node_attr_dim': 0,
  1704. 'geometry': None,
  1705. 'edge_attr_dim': 0,
  1706. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DD.zip',
  1707. 'domain': 'bioinformatics',
  1708. },
  1709. 'ENZYMES': {
  1710. 'database': 'tudataset',
  1711. 'reference': '[4,5]',
  1712. 'dataset_size': 600,
  1713. 'class_number': 6,
  1714. 'task_type': 'classification',
  1715. 'ave_node_num': 32.63,
  1716. 'ave_edge_num': 62.14,
  1717. 'node_labeled': True,
  1718. 'edge_labeled': False,
  1719. 'node_attr_dim': 18,
  1720. 'geometry': None,
  1721. 'edge_attr_dim': 0,
  1722. 'url': 'http://www.chrsmrrs.com/graphkerneldatasets/ENZYMES.zip',
  1723. 'domain': 'bioinformatics',
  1724. },
  1725. 'KKI': {
  1726. 'database': 'tudataset',
  1727. 'reference': '[26]',
  1728. 'dataset_size': 83,
  1729. 'class_number': 2,
  1730. 'task_type': 'classification',
  1731. 'ave_node_num': 26.96,
  1732. 'ave_edge_num': 48.42,
  1733. 'node_labeled': True,
  1734. 'edge_labeled': False,
  1735. 'node_attr_dim': 0,
  1736. 'geometry': None,
  1737. 'edge_attr_dim': 0,
  1738. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/KKI.zip',
  1739. 'domain': 'bioinformatics',
  1740. },
  1741. 'OHSU': {
  1742. 'database': 'tudataset',
  1743. 'reference': '[26]',
  1744. 'dataset_size': 79,
  1745. 'class_number': 2,
  1746. 'task_type': 'classification',
  1747. 'ave_node_num': 82.01,
  1748. 'ave_edge_num': 199.66,
  1749. 'node_labeled': True,
  1750. 'edge_labeled': False,
  1751. 'node_attr_dim': 0,
  1752. 'geometry': None,
  1753. 'edge_attr_dim': 0,
  1754. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OHSU.zip',
  1755. 'domain': 'bioinformatics',
  1756. },
  1757. 'Peking_1': {
  1758. 'database': 'tudataset',
  1759. 'reference': '[26]',
  1760. 'dataset_size': 85,
  1761. 'class_number': 2,
  1762. 'task_type': 'classification',
  1763. 'ave_node_num': 39.31,
  1764. 'ave_edge_num': 77.35,
  1765. 'node_labeled': True,
  1766. 'edge_labeled': False,
  1767. 'node_attr_dim': 0,
  1768. 'geometry': None,
  1769. 'edge_attr_dim': 0,
  1770. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Peking_1.zip',
  1771. 'domain': 'bioinformatics',
  1772. },
  1773. 'PROTEINS': {
  1774. 'database': 'tudataset',
  1775. 'reference': '[4,6]',
  1776. 'dataset_size': 1113,
  1777. 'class_number': 2,
  1778. 'task_type': 'classification',
  1779. 'ave_node_num': 39.06,
  1780. 'ave_edge_num': 72.82,
  1781. 'node_labeled': True,
  1782. 'edge_labeled': False,
  1783. 'node_attr_dim': 1,
  1784. 'geometry': None,
  1785. 'edge_attr_dim': 0,
  1786. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS.zip',
  1787. 'domain': 'bioinformatics',
  1788. },
  1789. 'PROTEINS_full': {
  1790. 'database': 'tudataset',
  1791. 'reference': '[4,6]',
  1792. 'dataset_size': 1113,
  1793. 'class_number': 2,
  1794. 'task_type': 'classification',
  1795. 'ave_node_num': 39.06,
  1796. 'ave_edge_num': 72.82,
  1797. 'node_labeled': True,
  1798. 'edge_labeled': False,
  1799. 'node_attr_dim': 29,
  1800. 'geometry': None,
  1801. 'edge_attr_dim': 0,
  1802. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS_full.zip',
  1803. 'domain': 'bioinformatics',
  1804. },
  1805. ### computer vision
  1806. 'COIL-DEL': {
  1807. 'database': 'tudataset',
  1808. 'reference': '[16,18]',
  1809. 'dataset_size': 3900,
  1810. 'class_number': 100,
  1811. 'task_type': 'classification',
  1812. 'ave_node_num': 21.54,
  1813. 'ave_edge_num': 54.24,
  1814. 'node_labeled': False,
  1815. 'edge_labeled': True,
  1816. 'node_attr_dim': 2,
  1817. 'geometry': None,
  1818. 'edge_attr_dim': 0,
  1819. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-DEL.zip',
  1820. 'domain': 'computer vision',
  1821. },
  1822. 'COIL-RAG': {
  1823. 'database': 'tudataset',
  1824. 'reference': '[16,18]',
  1825. 'dataset_size': 3900,
  1826. 'class_number': 100,
  1827. 'task_type': 'classification',
  1828. 'ave_node_num': 3.01,
  1829. 'ave_edge_num': 3.02,
  1830. 'node_labeled': False,
  1831. 'edge_labeled': False,
  1832. 'node_attr_dim': 64,
  1833. 'geometry': None,
  1834. 'edge_attr_dim': 1,
  1835. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-RAG.zip',
  1836. 'domain': 'computer vision',
  1837. },
  1838. 'Cuneiform': {
  1839. 'database': 'tudataset',
  1840. 'reference': '[25]',
  1841. 'dataset_size': 267,
  1842. 'class_number': 30,
  1843. 'task_type': 'classification',
  1844. 'ave_node_num': 21.27,
  1845. 'ave_edge_num': 44.8,
  1846. 'node_labeled': True,
  1847. 'edge_labeled': True,
  1848. 'node_attr_dim': 3,
  1849. 'geometry': '3D',
  1850. 'edge_attr_dim': 2,
  1851. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Cuneiform.zip',
  1852. 'domain': 'computer vision',
  1853. },
  1854. 'Fingerprint': {
  1855. 'database': 'tudataset',
  1856. 'reference': '[16,19]',
  1857. 'dataset_size': 2800,
  1858. 'class_number': 4,
  1859. 'task_type': 'classification',
  1860. 'ave_node_num': 5.42,
  1861. 'ave_edge_num': 4.42,
  1862. 'node_labeled': False,
  1863. 'edge_labeled': False,
  1864. 'node_attr_dim': 2,
  1865. 'geometry': '2D',
  1866. 'edge_attr_dim': 2,
  1867. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Fingerprint.zip',
  1868. 'domain': 'computer vision',
  1869. },
  1870. 'FIRSTMM_DB': {
  1871. 'database': 'tudataset',
  1872. 'reference': '[11,12,13]',
  1873. 'dataset_size': 41,
  1874. 'class_number': 11,
  1875. 'task_type': 'classification',
  1876. 'ave_node_num': 1377.27,
  1877. 'ave_edge_num': 3074.1,
  1878. 'node_labeled': True,
  1879. 'edge_labeled': False,
  1880. 'node_attr_dim': 1,
  1881. 'geometry': None,
  1882. 'edge_attr_dim': 2,
  1883. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FIRSTMM_DB.zip',
  1884. 'domain': 'computer vision',
  1885. },
  1886. 'Letter-high': {
  1887. 'database': 'tudataset',
  1888. 'reference': '[16]',
  1889. 'dataset_size': 2250,
  1890. 'class_number': 15,
  1891. 'task_type': 'classification',
  1892. 'ave_node_num': 4.67,
  1893. 'ave_edge_num': 4.5,
  1894. 'node_labeled': False,
  1895. 'edge_labeled': False,
  1896. 'node_attr_dim': 2,
  1897. 'geometry': '2D',
  1898. 'edge_attr_dim': 0,
  1899. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-high.zip',
  1900. 'domain': 'computer vision',
  1901. },
  1902. 'Letter-low': {
  1903. 'database': 'tudataset',
  1904. 'reference': '[16]',
  1905. 'dataset_size': 2250,
  1906. 'class_number': 15,
  1907. 'task_type': 'classification',
  1908. 'ave_node_num': 4.68,
  1909. 'ave_edge_num': 3.13,
  1910. 'node_labeled': False,
  1911. 'edge_labeled': False,
  1912. 'node_attr_dim': 2,
  1913. 'geometry': '2D',
  1914. 'edge_attr_dim': 0,
  1915. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-low.zip',
  1916. 'domain': 'computer vision',
  1917. },
  1918. 'Letter-med': {
  1919. 'database': 'tudataset',
  1920. 'reference': '[16]',
  1921. 'dataset_size': 2250,
  1922. 'class_number': 15,
  1923. 'task_type': 'classification',
  1924. 'ave_node_num': 4.67,
  1925. 'ave_edge_num': 4.5,
  1926. 'node_labeled': False,
  1927. 'edge_labeled': False,
  1928. 'node_attr_dim': 2,
  1929. 'geometry': '2D',
  1930. 'edge_attr_dim': 0,
  1931. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-med.zip',
  1932. 'domain': 'computer vision',
  1933. },
  1934. 'MSRC_9': {
  1935. 'database': 'tudataset',
  1936. 'reference': '[13]',
  1937. 'dataset_size': 221,
  1938. 'class_number': 8,
  1939. 'task_type': 'classification',
  1940. 'ave_node_num': 40.58,
  1941. 'ave_edge_num': 97.94,
  1942. 'node_labeled': True,
  1943. 'edge_labeled': False,
  1944. 'node_attr_dim': 0,
  1945. 'geometry': None,
  1946. 'edge_attr_dim': 0,
  1947. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_9.zip',
  1948. 'domain': 'computer vision',
  1949. },
  1950. 'MSRC_21': {
  1951. 'database': 'tudataset',
  1952. 'reference': '[13]',
  1953. 'dataset_size': 563,
  1954. 'class_number': 20,
  1955. 'task_type': 'classification',
  1956. 'ave_node_num': 77.52,
  1957. 'ave_edge_num': 198.32,
  1958. 'node_labeled': True,
  1959. 'edge_labeled': False,
  1960. 'node_attr_dim': 0,
  1961. 'geometry': None,
  1962. 'edge_attr_dim': 0,
  1963. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21.zip',
  1964. 'domain': 'computer vision',
  1965. },
  1966. 'MSRC_21C': {
  1967. 'database': 'tudataset',
  1968. 'reference': '[13]',
  1969. 'dataset_size': 209,
  1970. 'class_number': 20,
  1971. 'task_type': 'classification',
  1972. 'ave_node_num': 40.28,
  1973. 'ave_edge_num': 96.6,
  1974. 'node_labeled': True,
  1975. 'edge_labeled': False,
  1976. 'node_attr_dim': 0,
  1977. 'geometry': None,
  1978. 'edge_attr_dim': 0,
  1979. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21C.zip',
  1980. 'domain': 'computer vision',
  1981. },
  1982. ### social networks
  1983. 'COLLAB': {
  1984. 'database': 'tudataset',
  1985. 'reference': '[14]',
  1986. 'dataset_size': 5000,
  1987. 'class_number': 3,
  1988. 'task_type': 'classification',
  1989. 'ave_node_num': 74.49,
  1990. 'ave_edge_num': 2457.78,
  1991. 'node_labeled': False,
  1992. 'edge_labeled': False,
  1993. 'node_attr_dim': 0,
  1994. 'geometry': None,
  1995. 'edge_attr_dim': 0,
  1996. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLLAB.zip',
  1997. 'domain': 'social networks',
  1998. },
  1999. 'dblp_ct1': {
  2000. 'database': 'tudataset',
  2001. 'reference': '[32]',
  2002. 'dataset_size': 755,
  2003. 'class_number': 2,
  2004. 'task_type': 'classification',
  2005. 'ave_node_num': 52.87,
  2006. 'ave_edge_num': 320.09,
  2007. 'node_labeled': False,
  2008. 'edge_labeled': False,
  2009. 'node_attr_dim': 0,
  2010. 'geometry': None,
  2011. 'edge_attr_dim': 'temporal',
  2012. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct1.zip',
  2013. 'domain': 'social networks',
  2014. },
  2015. 'dblp_ct2': {
  2016. 'database': 'tudataset',
  2017. 'reference': '[32]',
  2018. 'dataset_size': 755,
  2019. 'class_number': 2,
  2020. 'task_type': 'classification',
  2021. 'ave_node_num': 52.87,
  2022. 'ave_edge_num': 320.09,
  2023. 'node_labeled': False,
  2024. 'edge_labeled': False,
  2025. 'node_attr_dim': 0,
  2026. 'geometry': None,
  2027. 'edge_attr_dim': 'temporal',
  2028. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct2.zip',
  2029. 'domain': 'social networks',
  2030. },
  2031. 'DBLP_v1': {
  2032. 'database': 'tudataset',
  2033. 'reference': '[26]',
  2034. 'dataset_size': 19456,
  2035. 'class_number': 2,
  2036. 'task_type': 'classification',
  2037. 'ave_node_num': 10.48,
  2038. 'ave_edge_num': 19.65,
  2039. 'node_labeled': True,
  2040. 'edge_labeled': True,
  2041. 'node_attr_dim': 0,
  2042. 'geometry': None,
  2043. 'edge_attr_dim': 0,
  2044. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DBLP_v1.zip',
  2045. 'domain': 'social networks',
  2046. },
  2047. 'deezer_ego_nets': {
  2048. 'database': 'tudataset',
  2049. 'reference': '[30]',
  2050. 'dataset_size': 9629,
  2051. 'class_number': 2,
  2052. 'task_type': 'classification',
  2053. 'ave_node_num': 23.49,
  2054. 'ave_edge_num': 65.25,
  2055. 'node_labeled': False,
  2056. 'edge_labeled': False,
  2057. 'node_attr_dim': 0,
  2058. 'geometry': None,
  2059. 'edge_attr_dim': 0,
  2060. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/deezer_ego_nets.zip',
  2061. 'domain': 'social networks',
  2062. },
  2063. 'facebook_ct1': {
  2064. 'database': 'tudataset',
  2065. 'reference': '[32]',
  2066. 'dataset_size': 995,
  2067. 'class_number': 2,
  2068. 'task_type': 'classification',
  2069. 'ave_node_num': 95.72,
  2070. 'ave_edge_num': 269.01,
  2071. 'node_labeled': False,
  2072. 'edge_labeled': False,
  2073. 'node_attr_dim': 0,
  2074. 'geometry': None,
  2075. 'edge_attr_dim': 'temporal',
  2076. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct1.zip',
  2077. 'domain': 'social networks',
  2078. },
  2079. 'facebook_ct2': {
  2080. 'database': 'tudataset',
  2081. 'reference': '[32]',
  2082. 'dataset_size': 995,
  2083. 'class_number': 2,
  2084. 'task_type': 'classification',
  2085. 'ave_node_num': 95.72,
  2086. 'ave_edge_num': 269.01,
  2087. 'node_labeled': False,
  2088. 'edge_labeled': False,
  2089. 'node_attr_dim': 0,
  2090. 'geometry': None,
  2091. 'edge_attr_dim': 'temporal',
  2092. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct2.zip',
  2093. 'domain': 'social networks',
  2094. },
  2095. 'github_stargazers': {
  2096. 'database': 'tudataset',
  2097. 'reference': '[30]',
  2098. 'dataset_size': 12725,
  2099. 'class_number': 2,
  2100. 'task_type': 'classification',
  2101. 'ave_node_num': 113.79,
  2102. 'ave_edge_num': 234.64,
  2103. 'node_labeled': False,
  2104. 'edge_labeled': False,
  2105. 'node_attr_dim': 0,
  2106. 'geometry': None,
  2107. 'edge_attr_dim': 0,
  2108. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/github_stargazers.zip',
  2109. 'domain': 'social networks',
  2110. },
  2111. 'highschool_ct1': {
  2112. 'database': 'tudataset',
  2113. 'reference': '[32]',
  2114. 'dataset_size': 180,
  2115. 'class_number': 2,
  2116. 'task_type': 'classification',
  2117. 'ave_node_num': 52.32,
  2118. 'ave_edge_num': 544.81,
  2119. 'node_labeled': False,
  2120. 'edge_labeled': False,
  2121. 'node_attr_dim': 0,
  2122. 'geometry': None,
  2123. 'edge_attr_dim': 'temporal',
  2124. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct1.zip',
  2125. 'domain': 'social networks',
  2126. },
  2127. 'highschool_ct2': {
  2128. 'database': 'tudataset',
  2129. 'reference': '[32]',
  2130. 'dataset_size': 180,
  2131. 'class_number': 2,
  2132. 'task_type': 'classification',
  2133. 'ave_node_num': 52.32,
  2134. 'ave_edge_num': 544.81,
  2135. 'node_labeled': False,
  2136. 'edge_labeled': False,
  2137. 'node_attr_dim': 0,
  2138. 'geometry': None,
  2139. 'edge_attr_dim': 'temporal',
  2140. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct2.zip',
  2141. 'domain': 'social networks',
  2142. },
  2143. 'IMDB-BINARY': {
  2144. 'database': 'tudataset',
  2145. 'reference': '[14]',
  2146. 'dataset_size': 1000,
  2147. 'class_number': 2,
  2148. 'task_type': 'classification',
  2149. 'ave_node_num': 19.77,
  2150. 'ave_edge_num': 96.53,
  2151. 'node_labeled': False,
  2152. 'edge_labeled': False,
  2153. 'node_attr_dim': 0,
  2154. 'geometry': '',
  2155. 'edge_attr_dim': 0,
  2156. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-BINARY.zip',
  2157. 'domain': 'social networks',
  2158. },
  2159. 'IMDB-MULTI': {
  2160. 'database': 'tudataset',
  2161. 'reference': '[14]',
  2162. 'dataset_size': 1500,
  2163. 'class_number': 3,
  2164. 'task_type': 'classification',
  2165. 'ave_node_num': 13.0,
  2166. 'ave_edge_num': 65.94,
  2167. 'node_labeled': False,
  2168. 'edge_labeled': False,
  2169. 'node_attr_dim': 0,
  2170. 'geometry': '',
  2171. 'edge_attr_dim': 0,
  2172. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-MULTI.zip',
  2173. 'domain': 'social networks',
  2174. },
  2175. 'infectious_ct1': {
  2176. 'database': 'tudataset',
  2177. 'reference': '[32]',
  2178. 'dataset_size': 200,
  2179. 'class_number': 2,
  2180. 'task_type': 'classification',
  2181. 'ave_node_num': 50.0,
  2182. 'ave_edge_num': 459.72,
  2183. 'node_labeled': False,
  2184. 'edge_labeled': False,
  2185. 'node_attr_dim': 0,
  2186. 'geometry': None,
  2187. 'edge_attr_dim': 'temporal',
  2188. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct1.zip',
  2189. 'domain': 'social networks',
  2190. },
  2191. 'infectious_ct2': {
  2192. 'database': 'tudataset',
  2193. 'reference': '[32]',
  2194. 'dataset_size': 200,
  2195. 'class_number': 2,
  2196. 'task_type': 'classification',
  2197. 'ave_node_num': 50.0,
  2198. 'ave_edge_num': 459.72,
  2199. 'node_labeled': False,
  2200. 'edge_labeled': False,
  2201. 'node_attr_dim': 0,
  2202. 'geometry': None,
  2203. 'edge_attr_dim': 'temporal',
  2204. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct2.zip',
  2205. 'domain': 'social networks',
  2206. },
  2207. 'mit_ct1': {
  2208. 'database': 'tudataset',
  2209. 'reference': '[32]',
  2210. 'dataset_size': 97,
  2211. 'class_number': 2,
  2212. 'task_type': 'classification',
  2213. 'ave_node_num': 20.0,
  2214. 'ave_edge_num': 1469.15,
  2215. 'node_labeled': False,
  2216. 'edge_labeled': False,
  2217. 'node_attr_dim': 0,
  2218. 'geometry': None,
  2219. 'edge_attr_dim': 'temporal',
  2220. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct1.zip',
  2221. 'domain': 'social networks',
  2222. },
  2223. 'mit_ct2': {
  2224. 'database': 'tudataset',
  2225. 'reference': '[32]',
  2226. 'dataset_size': 97,
  2227. 'class_number': 2,
  2228. 'task_type': 'classification',
  2229. 'ave_node_num': 20.0,
  2230. 'ave_edge_num': 1469.15,
  2231. 'node_labeled': False,
  2232. 'edge_labeled': False,
  2233. 'node_attr_dim': 0,
  2234. 'geometry': None,
  2235. 'edge_attr_dim': 'temporal',
  2236. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct2.zip',
  2237. 'domain': 'social networks',
  2238. },
  2239. 'REDDIT-BINARY': {
  2240. 'database': 'tudataset',
  2241. 'reference': '[14]',
  2242. 'dataset_size': 2000,
  2243. 'class_number': 2,
  2244. 'task_type': 'classification',
  2245. 'ave_node_num': 429.63,
  2246. 'ave_edge_num': 497.75,
  2247. 'node_labeled': False,
  2248. 'edge_labeled': False,
  2249. 'node_attr_dim': 0,
  2250. 'geometry': None,
  2251. 'edge_attr_dim': 0,
  2252. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-BINARY.zip',
  2253. 'domain': 'social networks',
  2254. },
  2255. 'REDDIT-MULTI-5K': {
  2256. 'database': 'tudataset',
  2257. 'reference': '[14]',
  2258. 'dataset_size': 4999,
  2259. 'class_number': 5,
  2260. 'task_type': 'classification',
  2261. 'ave_node_num': 508.52,
  2262. 'ave_edge_num': 594.87,
  2263. 'node_labeled': False,
  2264. 'edge_labeled': False,
  2265. 'node_attr_dim': 0,
  2266. 'geometry': None,
  2267. 'edge_attr_dim': 0,
  2268. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-5K.zip',
  2269. 'domain': 'social networks',
  2270. },
  2271. 'REDDIT-MULTI-12K': {
  2272. 'database': 'tudataset',
  2273. 'reference': '[14]',
  2274. 'dataset_size': 11929,
  2275. 'class_number': 11,
  2276. 'task_type': 'classification',
  2277. 'ave_node_num': 391.41,
  2278. 'ave_edge_num': 456.89,
  2279. 'node_labeled': False,
  2280. 'edge_labeled': False,
  2281. 'node_attr_dim': 0,
  2282. 'geometry': None,
  2283. 'edge_attr_dim': 0,
  2284. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-12K.zip',
  2285. 'domain': 'social networks',
  2286. },
  2287. 'reddit_threads': {
  2288. 'database': 'tudataset',
  2289. 'reference': '[30]',
  2290. 'dataset_size': 203088,
  2291. 'class_number': 2,
  2292. 'task_type': 'classification',
  2293. 'ave_node_num': 23.93,
  2294. 'ave_edge_num': 24.99,
  2295. 'node_labeled': False,
  2296. 'edge_labeled': False,
  2297. 'node_attr_dim': 0,
  2298. 'geometry': None,
  2299. 'edge_attr_dim': 0,
  2300. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/reddit_threads.zip',
  2301. 'domain': 'social networks',
  2302. },
  2303. 'tumblr_ct1': {
  2304. 'database': 'tudataset',
  2305. 'reference': '[32]',
  2306. 'dataset_size': 373,
  2307. 'class_number': 2,
  2308. 'task_type': 'classification',
  2309. 'ave_node_num': 53.11,
  2310. 'ave_edge_num': 199.78,
  2311. 'node_labeled': False,
  2312. 'edge_labeled': False,
  2313. 'node_attr_dim': 0,
  2314. 'geometry': None,
  2315. 'edge_attr_dim': 'temporal',
  2316. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct1.zip',
  2317. 'domain': 'social networks',
  2318. },
  2319. 'tumblr_ct2': {
  2320. 'database': 'tudataset',
  2321. 'reference': '[32]',
  2322. 'dataset_size': 373,
  2323. 'class_number': 2,
  2324. 'task_type': 'classification',
  2325. 'ave_node_num': 53.11,
  2326. 'ave_edge_num': 199.78,
  2327. 'node_labeled': False,
  2328. 'edge_labeled': False,
  2329. 'node_attr_dim': 0,
  2330. 'geometry': None,
  2331. 'edge_attr_dim': 'temporal',
  2332. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct2.zip',
  2333. 'domain': 'social networks',
  2334. },
  2335. 'twitch_egos': {
  2336. 'database': 'tudataset',
  2337. 'reference': '[30]',
  2338. 'dataset_size': 127094,
  2339. 'class_number': 2,
  2340. 'task_type': 'classification',
  2341. 'ave_node_num': 29.67,
  2342. 'ave_edge_num': 86.59,
  2343. 'node_labeled': False,
  2344. 'edge_labeled': False,
  2345. 'node_attr_dim': 0,
  2346. 'geometry': None,
  2347. 'edge_attr_dim': 0,
  2348. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/twitch_egos.zip',
  2349. 'domain': 'social networks',
  2350. },
  2351. 'TWITTER-Real-Graph-Partial': {
  2352. 'database': 'tudataset',
  2353. 'reference': '[26]',
  2354. 'dataset_size': 144033,
  2355. 'class_number': 2,
  2356. 'task_type': 'classification',
  2357. 'ave_node_num': 4.03,
  2358. 'ave_edge_num': 4.98,
  2359. 'node_labeled': True,
  2360. 'edge_labeled': False,
  2361. 'node_attr_dim': 0,
  2362. 'geometry': None,
  2363. 'edge_attr_dim': 1,
  2364. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TWITTER-Real-Graph-Partial.zip',
  2365. 'domain': 'social networks',
  2366. },
  2367. ### synthetic
  2368. 'COLORS-3': {
  2369. 'database': 'tudataset',
  2370. 'reference': '[27]',
  2371. 'dataset_size': 10500,
  2372. 'class_number': 11,
  2373. 'task_type': 'classification',
  2374. 'ave_node_num': 61.31,
  2375. 'ave_edge_num': 91.03,
  2376. 'node_labeled': False,
  2377. 'edge_labeled': False,
  2378. 'node_attr_dim': 4,
  2379. 'geometry': None,
  2380. 'edge_attr_dim': 0,
  2381. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLORS-3.zip',
  2382. 'domain': 'synthetic',
  2383. },
  2384. 'SYNTHETIC': {
  2385. 'database': 'tudataset',
  2386. 'reference': '[3]',
  2387. 'dataset_size': 300,
  2388. 'class_number': 2,
  2389. 'task_type': 'classification',
  2390. 'ave_node_num': 100.0,
  2391. 'ave_edge_num': 196.0,
  2392. 'node_labeled': False,
  2393. 'edge_labeled': False,
  2394. 'node_attr_dim': 1,
  2395. 'geometry': None,
  2396. 'edge_attr_dim': 0,
  2397. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETIC.zip',
  2398. 'domain': 'synthetic',
  2399. },
  2400. 'SYNTHETICnew': {
  2401. 'database': 'tudataset',
  2402. 'reference': '[3,10]',
  2403. 'dataset_size': 300,
  2404. 'class_number': 2,
  2405. 'task_type': 'classification',
  2406. 'ave_node_num': 100.0,
  2407. 'ave_edge_num': 196.25,
  2408. 'node_labeled': False,
  2409. 'edge_labeled': False,
  2410. 'node_attr_dim': 1,
  2411. 'geometry': None,
  2412. 'edge_attr_dim': 0,
  2413. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETICnew.zip',
  2414. 'domain': 'synthetic',
  2415. },
  2416. 'Synthie': {
  2417. 'database': 'tudataset',
  2418. 'reference': '[21]',
  2419. 'dataset_size': 400,
  2420. 'class_number': 4,
  2421. 'task_type': 'classification',
  2422. 'ave_node_num': 95.0,
  2423. 'ave_edge_num': 172.93,
  2424. 'node_labeled': False,
  2425. 'edge_labeled': False,
  2426. 'node_attr_dim': 15,
  2427. 'geometry': None,
  2428. 'edge_attr_dim': 0,
  2429. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Synthie.zip',
  2430. 'domain': 'synthetic',
  2431. },
  2432. 'TRIANGLES': {
  2433. 'database': 'tudataset',
  2434. 'reference': '[27]',
  2435. 'dataset_size': 45000,
  2436. 'class_number': 10,
  2437. 'task_type': 'classification',
  2438. 'ave_node_num': 20.85,
  2439. 'ave_edge_num': 32.74,
  2440. 'node_labeled': False,
  2441. 'edge_labeled': False,
  2442. 'node_attr_dim': 0,
  2443. 'geometry': None,
  2444. 'edge_attr_dim': 0,
  2445. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TRIANGLES.zip',
  2446. 'domain': 'synthetic',
  2447. },
  2448. }
  2449. DATASET_META = {**GREYC_META, **IAM_META, **TUDataset_META}
  2450. def list_of_databases():
  2451. """List names of all databases.
  2452. Returns
  2453. -------
  2454. list
  2455. The list of all databases.
  2456. """
  2457. return [i for i in DATABASES]
  2458. def list_of_datasets():
  2459. """List names of all datasets.
  2460. Returns
  2461. -------
  2462. list
  2463. The list of all datasets.
  2464. """
  2465. return [i for i in DATASET_META]

A Python package for graph kernels, graph edit distances, and the graph pre-image problem.