You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

metadata.py 65 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. Created on Tue Oct 20 14:25:49 2020
  5. @author: ljia
  6. """
  7. DATABASES = {
  8. 'greyc': 'https://brunl01.users.greyc.fr/CHEMISTRY/',
  9. 'iam': 'https://iapr-tc15.greyc.fr/IAM/',
  10. 'tudataset': 'http://graphlearning.io/docs/datasets/',
  11. }
  12. ### -------- database greyc -------- ###
  13. GREYC_META = {
  14. 'ACE': {
  15. 'database': 'greyc',
  16. 'reference': None,
  17. 'dataset_size': 32,
  18. 'class_number': 2,
  19. 'task_type': 'classification',
  20. 'ave_node_num': 52,
  21. 'ave_edge_num': None,
  22. 'node_labeled': None,
  23. 'edge_labeled': None,
  24. 'node_attr_dim': None,
  25. 'geometry': None,
  26. 'edge_attr_dim': None,
  27. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ACEDataset.tar',
  28. 'domain': 'small molecules',
  29. 'train_valid_test': [],
  30. 'stereoisomerism': True,
  31. 'load_files': ['data.ds'],
  32. 'extra_params': {'gformat': 'cml'}
  33. },
  34. 'Acyclic': {
  35. 'database': 'greyc',
  36. 'reference': None,
  37. 'dataset_size': 183,
  38. 'class_number': None,
  39. 'task_type': 'regression',
  40. 'ave_node_num': 8.15,
  41. 'ave_edge_num': 7.15,
  42. 'node_labeled': True,
  43. 'edge_labeled': False,
  44. 'node_attr_dim': 0,
  45. 'geometry': None,
  46. 'edge_attr_dim': 0,
  47. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/Acyclic.tar.gz',
  48. 'domain': 'small molecules',
  49. 'train_valid_test': None,
  50. 'stereoisomerism': False,
  51. 'load_files': ['dataset_bps.ds'],
  52. },
  53. 'AIDS_greyc': {
  54. 'database': 'greyc',
  55. 'reference': None,
  56. 'dataset_size': 2000,
  57. 'class_number': 2,
  58. 'task_type': 'classification',
  59. 'ave_node_num': 15.69,
  60. 'ave_edge_num': 16.20,
  61. 'node_labeled': True,
  62. 'edge_labeled': True,
  63. 'node_attr_dim': None,
  64. 'geometry': None,
  65. 'edge_attr_dim': None,
  66. 'url': 'https://iapr-tc15.greyc.fr/IAM/AIDS.zip',
  67. 'domain': 'small molecules',
  68. 'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl',],
  69. 'stereoisomerism': False,
  70. 'load_files': ['data/'],
  71. },
  72. 'Alkane': {
  73. 'database': 'greyc',
  74. 'reference': None,
  75. 'dataset_size': 150,
  76. 'class_number': None,
  77. 'task_type': 'regression',
  78. 'ave_node_num': 8.87,
  79. 'ave_edge_num': 7.87,
  80. 'node_labeled': False,
  81. 'edge_labeled': False,
  82. 'node_attr_dim': 0,
  83. 'geometry': None,
  84. 'edge_attr_dim': 0,
  85. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/alkane_dataset.tar.gz',
  86. 'domain': 'small molecules',
  87. 'train_valid_test': None,
  88. 'stereoisomerism': False,
  89. 'load_files': ['dataset.ds', 'dataset_boiling_point_names.txt'],
  90. },
  91. 'Chiral': {
  92. 'database': 'greyc',
  93. 'reference': None,
  94. 'dataset_size': 35,
  95. 'class_number': None,
  96. 'task_type': 'regression',
  97. 'ave_node_num': 21.29,
  98. 'ave_edge_num': None,
  99. 'node_labeled': None,
  100. 'edge_labeled': None,
  101. 'node_attr_dim': None,
  102. 'geometry': None,
  103. 'edge_attr_dim': None,
  104. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetAcyclicChiral.tar',
  105. 'domain': 'small molecules',
  106. 'train_valid_test': [],
  107. 'stereoisomerism': True,
  108. 'load_files': ['data.txt'],
  109. 'extra_params': {'gformat': 'cml'}
  110. },
  111. 'MAO': {
  112. 'database': 'greyc',
  113. 'reference': None,
  114. 'dataset_size': 68,
  115. 'class_number': 2,
  116. 'task_type': 'classification',
  117. 'ave_node_num': 18.38,
  118. 'ave_edge_num': 19.63,
  119. 'node_labeled': True,
  120. 'edge_labeled': True,
  121. 'node_attr_dim': 0,
  122. 'geometry': None,
  123. 'edge_attr_dim': 0,
  124. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/mao.tgz',
  125. 'domain': 'small molecules',
  126. 'train_valid_test': None,
  127. 'stereoisomerism': False,
  128. 'load_files': ['dataset.ds'],
  129. },
  130. 'Monoterpenoides': {
  131. 'database': 'greyc',
  132. 'reference': None,
  133. 'dataset_size': 382,
  134. 'class_number': 10,
  135. 'task_type': 'classification',
  136. 'ave_node_num': 10,
  137. 'ave_edge_num': None,
  138. 'node_labeled': None,
  139. 'edge_labeled': None,
  140. 'node_attr_dim': None,
  141. 'geometry': None,
  142. 'edge_attr_dim': None,
  143. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/monoterpenoides.tar.gz',
  144. 'domain': 'small molecules',
  145. 'train_valid_test': None,
  146. 'stereoisomerism': False,
  147. 'load_files': ['dataset_10+.ds'],
  148. },
  149. 'PAH': {
  150. 'database': 'greyc',
  151. 'reference': None,
  152. 'dataset_size': 94,
  153. 'class_number': 2,
  154. 'task_type': 'classification',
  155. 'ave_node_num': 20.7,
  156. 'ave_edge_num': 24.43,
  157. 'node_labeled': False,
  158. 'edge_labeled': False,
  159. 'node_attr_dim': 0,
  160. 'geometry': None,
  161. 'edge_attr_dim': 0,
  162. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/PAH.tar.gz',
  163. 'domain': 'small molecules',
  164. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  165. 'stereoisomerism': False,
  166. 'load_files': [['trainset_0.ds', 'testset_0.ds']],
  167. },
  168. 'PTC': {
  169. 'database': 'greyc',
  170. 'reference': None,
  171. 'dataset_size': 416,
  172. 'class_number': None,
  173. 'task_type': 'classification',
  174. 'ave_node_num': 14.4,
  175. 'ave_edge_num': None,
  176. 'node_labeled': None,
  177. 'edge_labeled': None,
  178. 'node_attr_dim': None,
  179. 'geometry': None,
  180. 'edge_attr_dim': None,
  181. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ptc.tgz',
  182. 'domain': 'small molecules',
  183. 'train_valid_test': None,
  184. 'stereoisomerism': False,
  185. 'load_files': [],
  186. 'extra_info': 'This dataset has test and train datasets. Select gender between mm, fm, mr, fr. \ndataloader = DataLoader(\'Ptc\',root = ..., option = \'mm\') \ntest,train = dataloader.dataset \nGs_test, y_test = test \nGs_train_, y_train = train',
  187. },
  188. 'Steroid': {
  189. 'database': 'greyc',
  190. 'reference': None,
  191. 'dataset_size': 64,
  192. 'class_number': None,
  193. 'task_type': 'regression',
  194. 'ave_node_num': 75.11,
  195. 'ave_edge_num': None,
  196. 'node_labeled': None,
  197. 'edge_labeled': None,
  198. 'node_attr_dim': None,
  199. 'geometry': None,
  200. 'edge_attr_dim': None,
  201. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/SteroidDataset.tar',
  202. 'domain': 'small molecules',
  203. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  204. 'stereoisomerism': False,
  205. 'load_files': ['dataWithOutsider.ds'],
  206. 'extra_params': {'gformat': 'cml'}
  207. },
  208. 'Vitamin_D': {
  209. 'database': 'greyc',
  210. 'reference': None,
  211. 'dataset_size': 69,
  212. 'class_number': None,
  213. 'task_type': 'regression',
  214. 'ave_node_num': 76.91,
  215. 'ave_edge_num': None,
  216. 'node_labeled': None,
  217. 'edge_labeled': None,
  218. 'node_attr_dim': None,
  219. 'geometry': None,
  220. 'edge_attr_dim': None,
  221. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetVitamin.tar',
  222. 'domain': 'small molecules',
  223. 'train_valid_test': [],
  224. 'stereoisomerism': True,
  225. 'load_files': ['data.txt'],
  226. 'extra_params': {'gformat': 'cml'}
  227. },
  228. }
  229. ### -------- database iam -------- ###
  230. # @todo: several datasets in this database are included in TUDataset. However they do not include train/valid/test sets.
  231. IAM_META = {
  232. 'GREC': {
  233. 'database': 'iam',
  234. 'reference': None,
  235. 'dataset_size': None,
  236. 'class_number': None,
  237. 'task_type': None,
  238. 'ave_node_num': None,
  239. 'ave_edge_num': None,
  240. 'node_labeled': None,
  241. 'edge_labeled': None,
  242. 'node_attr_dim': None,
  243. 'geometry': None,
  244. 'edge_attr_dim': None,
  245. 'url': 'https://iapr-tc15.greyc.fr/IAM/GREC.zip',
  246. 'domain': None,
  247. 'train_valid_test': ['data/test.cxl','data/train.cxl', 'data/valid.cxl'],
  248. 'load_files': [['data/test.cxl','data/train.cxl', 'data/valid.cxl']],
  249. },
  250. 'Web': {
  251. 'database': 'iam',
  252. 'reference': None,
  253. 'dataset_size': None,
  254. 'class_number': None,
  255. 'task_type': None,
  256. 'ave_node_num': None,
  257. 'ave_edge_num': None,
  258. 'node_labeled': None,
  259. 'edge_labeled': None,
  260. 'node_attr_dim': None,
  261. 'geometry': None,
  262. 'edge_attr_dim': None,
  263. 'url': 'https://iapr-tc15.greyc.fr/IAM/Web.zip',
  264. 'domain': None,
  265. 'train_valid_test': ['data/test.cxl', 'data/train.cxl', 'data/valid.cxl'],
  266. 'load_files': [['data/test.cxl','data/train.cxl', 'data/valid.cxl']],
  267. },
  268. }
  269. ### -------- database tudataset -------- ###
  270. TUDataset_META = {
  271. ### small molecules
  272. 'AIDS': {
  273. 'database': 'tudataset',
  274. 'reference': '[16,17]',
  275. 'dataset_size': 2000,
  276. 'class_number': 2,
  277. 'task_type': 'classification',
  278. 'ave_node_num': 15.69,
  279. 'ave_edge_num': 16.2,
  280. 'node_labeled': True,
  281. 'edge_labeled': True,
  282. 'node_attr_dim': 4,
  283. 'geometry': None,
  284. 'edge_attr_dim': 0,
  285. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/AIDS.zip',
  286. 'domain': 'small molecules',
  287. },
  288. 'alchemy_full': {
  289. 'database': 'tudataset',
  290. 'reference': '[29]',
  291. 'dataset_size': 202579,
  292. 'class_number': None,
  293. 'task_type': 'regression',
  294. 'ave_node_num': 10.1,
  295. 'ave_edge_num': 10.44,
  296. 'node_labeled': True,
  297. 'edge_labeled': True,
  298. 'node_attr_dim': 3,
  299. 'geometry': '3D, RI',
  300. 'edge_attr_dim': 0,
  301. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/alchemy_full.zip',
  302. 'domain': 'small molecules',
  303. },
  304. 'aspirin': {
  305. 'database': 'tudataset',
  306. 'reference': '[36]',
  307. 'dataset_size': 111763,
  308. 'class_number': None,
  309. 'task_type': 'regression',
  310. 'ave_node_num': 21.0,
  311. 'ave_edge_num': 151.52,
  312. 'node_labeled': True,
  313. 'edge_labeled': False,
  314. 'node_attr_dim': 6,
  315. 'geometry': '3D, RI',
  316. 'edge_attr_dim': 0,
  317. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/aspirin.zip',
  318. 'domain': 'small molecules',
  319. },
  320. 'benzene': {
  321. 'database': 'tudataset',
  322. 'reference': '[36]',
  323. 'dataset_size': 527984,
  324. 'class_number': None,
  325. 'task_type': 'regression',
  326. 'ave_node_num': 12.0,
  327. 'ave_edge_num': 64.94,
  328. 'node_labeled': True,
  329. 'edge_labeled': False,
  330. 'node_attr_dim': 6,
  331. 'geometry': '3D, RI',
  332. 'edge_attr_dim': 0,
  333. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/benzene.zip',
  334. 'domain': 'small molecules',
  335. },
  336. 'BZR': {
  337. 'database': 'tudataset',
  338. 'reference': '[7]',
  339. 'dataset_size': 405,
  340. 'class_number': 2,
  341. 'task_type': 'classification',
  342. 'ave_node_num': 35.75,
  343. 'ave_edge_num': 38.36,
  344. 'node_labeled': True,
  345. 'edge_labeled': False,
  346. 'node_attr_dim': 3,
  347. 'geometry': '3D, RI',
  348. 'edge_attr_dim': 0,
  349. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR.zip',
  350. 'domain': 'small molecules',
  351. },
  352. 'BZR_MD': {
  353. 'database': 'tudataset',
  354. 'reference': '[7,23]',
  355. 'dataset_size': 306,
  356. 'class_number': 2,
  357. 'task_type': 'classification',
  358. 'ave_node_num': 21.3,
  359. 'ave_edge_num': 225.06,
  360. 'node_labeled': True,
  361. 'edge_labeled': True,
  362. 'node_attr_dim': 0,
  363. 'geometry': None,
  364. 'edge_attr_dim': 1,
  365. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR_MD.zip',
  366. 'domain': 'small molecules',
  367. },
  368. 'COX2': {
  369. 'database': 'tudataset',
  370. 'reference': '[7]',
  371. 'dataset_size': 467,
  372. 'class_number': 2,
  373. 'task_type': 'classification',
  374. 'ave_node_num': 41.22,
  375. 'ave_edge_num': 43.45,
  376. 'node_labeled': True,
  377. 'edge_labeled': False,
  378. 'node_attr_dim': 3,
  379. 'geometry': '3D, RI',
  380. 'edge_attr_dim': 0,
  381. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2.zip',
  382. 'domain': 'small molecules',
  383. },
  384. 'COX2_MD': {
  385. 'database': 'tudataset',
  386. 'reference': '[7,23]',
  387. 'dataset_size': 303,
  388. 'class_number': 2,
  389. 'task_type': 'classification',
  390. 'ave_node_num': 26.28,
  391. 'ave_edge_num': 335.12,
  392. 'node_labeled': True,
  393. 'edge_labeled': True,
  394. 'node_attr_dim': 0,
  395. 'geometry': None,
  396. 'edge_attr_dim': 1,
  397. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2_MD.zip',
  398. 'domain': 'small molecules',
  399. },
  400. 'DHFR': {
  401. 'database': 'tudataset',
  402. 'reference': '[7]',
  403. 'dataset_size': 467,
  404. 'class_number': 2,
  405. 'task_type': 'classification',
  406. 'ave_node_num': 42.43,
  407. 'ave_edge_num': 44.54,
  408. 'node_labeled': True,
  409. 'edge_labeled': False,
  410. 'node_attr_dim': 3,
  411. 'geometry': '3D, RI',
  412. 'edge_attr_dim': 0,
  413. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR.zip',
  414. 'domain': 'small molecules',
  415. },
  416. 'DHFR_MD': {
  417. 'database': 'tudataset',
  418. 'reference': '[7,23]',
  419. 'dataset_size': 393,
  420. 'class_number': 2,
  421. 'task_type': 'classification',
  422. 'ave_node_num': 23.87,
  423. 'ave_edge_num': 283.01,
  424. 'node_labeled': True,
  425. 'edge_labeled': True,
  426. 'node_attr_dim': 0,
  427. 'geometry': None,
  428. 'edge_attr_dim': 1,
  429. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR_MD.zip',
  430. 'domain': 'small molecules',
  431. },
  432. 'ER_MD': {
  433. 'database': 'tudataset',
  434. 'reference': '[7,23]',
  435. 'dataset_size': 446,
  436. 'class_number': 2,
  437. 'task_type': 'classification',
  438. 'ave_node_num': 21.33,
  439. 'ave_edge_num': 234.85,
  440. 'node_labeled': True,
  441. 'edge_labeled': True,
  442. 'node_attr_dim': 0,
  443. 'geometry': None,
  444. 'edge_attr_dim': 1,
  445. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ER_MD.zip',
  446. 'domain': 'small molecules',
  447. },
  448. 'ethanol': {
  449. 'database': 'tudataset',
  450. 'reference': '[36]',
  451. 'dataset_size': 455093,
  452. 'class_number': None,
  453. 'task_type': 'regression',
  454. 'ave_node_num': 9.0,
  455. 'ave_edge_num': 36.0,
  456. 'node_labeled': True,
  457. 'edge_labeled': False,
  458. 'node_attr_dim': 6,
  459. 'geometry': '3D, RI',
  460. 'edge_attr_dim': 0,
  461. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ethanol.zip',
  462. 'domain': 'small molecules',
  463. },
  464. 'FRANKENSTEIN': {
  465. 'database': 'tudataset',
  466. 'reference': '[15]',
  467. 'dataset_size': 4337,
  468. 'class_number': 2,
  469. 'task_type': 'classification',
  470. 'ave_node_num': 16.9,
  471. 'ave_edge_num': 17.88,
  472. 'node_labeled': False,
  473. 'edge_labeled': False,
  474. 'node_attr_dim': 780,
  475. 'geometry': None,
  476. 'edge_attr_dim': 0,
  477. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FRANKENSTEIN.zip',
  478. 'domain': 'small molecules',
  479. },
  480. 'malonaldehyde': {
  481. 'database': 'tudataset',
  482. 'reference': '[36]',
  483. 'dataset_size': 893238,
  484. 'class_number': None,
  485. 'task_type': 'regression',
  486. 'ave_node_num': 9.0,
  487. 'ave_edge_num': 36.0,
  488. 'node_labeled': True,
  489. 'edge_labeled': False,
  490. 'node_attr_dim': 6,
  491. 'geometry': '3D, RI',
  492. 'edge_attr_dim': 0,
  493. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/malonaldehyde.zip',
  494. 'domain': 'small molecules',
  495. },
  496. 'MCF-7': {
  497. 'database': 'tudataset',
  498. 'reference': '[28]',
  499. 'dataset_size': 27770,
  500. 'class_number': 2,
  501. 'task_type': 'classification',
  502. 'ave_node_num': 26.39,
  503. 'ave_edge_num': 28.52,
  504. 'node_labeled': True,
  505. 'edge_labeled': True,
  506. 'node_attr_dim': 0,
  507. 'geometry': None,
  508. 'edge_attr_dim': 0,
  509. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7.zip',
  510. 'domain': 'small molecules',
  511. },
  512. 'MCF-7H': {
  513. 'database': 'tudataset',
  514. 'reference': '[28]',
  515. 'dataset_size': 27770,
  516. 'class_number': 2,
  517. 'task_type': 'classification',
  518. 'ave_node_num': 47.3,
  519. 'ave_edge_num': 49.43,
  520. 'node_labeled': True,
  521. 'edge_labeled': True,
  522. 'node_attr_dim': 0,
  523. 'geometry': None,
  524. 'edge_attr_dim': 0,
  525. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7H.zip',
  526. 'domain': 'small molecules',
  527. },
  528. 'MOLT-4': {
  529. 'database': 'tudataset',
  530. 'reference': '[28]',
  531. 'dataset_size': 39765,
  532. 'class_number': 2,
  533. 'task_type': 'classification',
  534. 'ave_node_num': 26.09,
  535. 'ave_edge_num': 28.13,
  536. 'node_labeled': True,
  537. 'edge_labeled': True,
  538. 'node_attr_dim': 0,
  539. 'geometry': None,
  540. 'edge_attr_dim': 0,
  541. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4.zip',
  542. 'domain': 'small molecules',
  543. },
  544. 'MOLT-4H': {
  545. 'database': 'tudataset',
  546. 'reference': '[28]',
  547. 'dataset_size': 39765,
  548. 'class_number': 2,
  549. 'task_type': 'classification',
  550. 'ave_node_num': 46.7,
  551. 'ave_edge_num': 48.73,
  552. 'node_labeled': True,
  553. 'edge_labeled': True,
  554. 'node_attr_dim': 0,
  555. 'geometry': None,
  556. 'edge_attr_dim': 0,
  557. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4H.zip',
  558. 'domain': 'small molecules',
  559. },
  560. 'Mutagenicity': {
  561. 'database': 'tudataset',
  562. 'reference': '[16,20]',
  563. 'dataset_size': 4337,
  564. 'class_number': 2,
  565. 'task_type': 'classification',
  566. 'ave_node_num': 30.32,
  567. 'ave_edge_num': 30.77,
  568. 'node_labeled': True,
  569. 'edge_labeled': True,
  570. 'node_attr_dim': 0,
  571. 'geometry': None,
  572. 'edge_attr_dim': 0,
  573. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Mutagenicity.zip',
  574. 'domain': 'small molecules',
  575. },
  576. 'MUTAG': {
  577. 'database': 'tudataset',
  578. 'reference': '[1,23]',
  579. 'dataset_size': 188,
  580. 'class_number': 2,
  581. 'task_type': 'classification',
  582. 'ave_node_num': 17.93,
  583. 'ave_edge_num': 19.79,
  584. 'node_labeled': True,
  585. 'edge_labeled': True,
  586. 'node_attr_dim': 0,
  587. 'geometry': None,
  588. 'edge_attr_dim': 0,
  589. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip',
  590. 'domain': 'small molecules',
  591. },
  592. 'naphthalene': {
  593. 'database': 'tudataset',
  594. 'reference': '[36]',
  595. 'dataset_size': 226256,
  596. 'class_number': None,
  597. 'task_type': 'regression',
  598. 'ave_node_num': 18.0,
  599. 'ave_edge_num': 127.37,
  600. 'node_labeled': True,
  601. 'edge_labeled': False,
  602. 'node_attr_dim': 6,
  603. 'geometry': '3D, RI',
  604. 'edge_attr_dim': 0,
  605. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/naphthalene.zip',
  606. 'domain': 'small molecules',
  607. },
  608. 'NCI1': {
  609. 'database': 'tudataset',
  610. 'reference': '[8,9,22]',
  611. 'dataset_size': 4110,
  612. 'class_number': 2,
  613. 'task_type': 'classification',
  614. 'ave_node_num': 29.87,
  615. 'ave_edge_num': 32.3,
  616. 'node_labeled': True,
  617. 'edge_labeled': False,
  618. 'node_attr_dim': 0,
  619. 'geometry': None,
  620. 'edge_attr_dim': 0,
  621. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI1.zip',
  622. 'domain': 'small molecules',
  623. },
  624. 'NCI109': {
  625. 'database': 'tudataset',
  626. 'reference': '[8,9,22]',
  627. 'dataset_size': 4127,
  628. 'class_number': 2,
  629. 'task_type': 'classification',
  630. 'ave_node_num': 29.68,
  631. 'ave_edge_num': 32.13,
  632. 'node_labeled': True,
  633. 'edge_labeled': False,
  634. 'node_attr_dim': 0,
  635. 'geometry': None,
  636. 'edge_attr_dim': 0,
  637. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI109.zip',
  638. 'domain': 'small molecules',
  639. },
  640. 'NCI-H23': {
  641. 'database': 'tudataset',
  642. 'reference': '[28]',
  643. 'dataset_size': 40353,
  644. 'class_number': 2,
  645. 'task_type': 'classification',
  646. 'ave_node_num': 26.07,
  647. 'ave_edge_num': 28.1,
  648. 'node_labeled': True,
  649. 'edge_labeled': True,
  650. 'node_attr_dim': 0,
  651. 'geometry': None,
  652. 'edge_attr_dim': 0,
  653. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23.zip',
  654. 'domain': 'small molecules',
  655. },
  656. 'NCI-H23H': {
  657. 'database': 'tudataset',
  658. 'reference': '[28]',
  659. 'dataset_size': 40353,
  660. 'class_number': 2,
  661. 'task_type': 'classification',
  662. 'ave_node_num': 46.67,
  663. 'ave_edge_num': 48.69,
  664. 'node_labeled': True,
  665. 'edge_labeled': True,
  666. 'node_attr_dim': 0,
  667. 'geometry': None,
  668. 'edge_attr_dim': 0,
  669. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23H.zip',
  670. 'domain': 'small molecules',
  671. },
  672. 'OVCAR-8': {
  673. 'database': 'tudataset',
  674. 'reference': '[28]',
  675. 'dataset_size': 40516,
  676. 'class_number': 2,
  677. 'task_type': 'classification',
  678. 'ave_node_num': 26.07,
  679. 'ave_edge_num': 28.1,
  680. 'node_labeled': True,
  681. 'edge_labeled': True,
  682. 'node_attr_dim': 0,
  683. 'geometry': None,
  684. 'edge_attr_dim': 0,
  685. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8.zip',
  686. 'domain': 'small molecules',
  687. },
  688. 'OVCAR-8H': {
  689. 'database': 'tudataset',
  690. 'reference': '[28]',
  691. 'dataset_size': 40516,
  692. 'class_number': 2,
  693. 'task_type': 'classification',
  694. 'ave_node_num': 46.67,
  695. 'ave_edge_num': 48.7,
  696. 'node_labeled': True,
  697. 'edge_labeled': True,
  698. 'node_attr_dim': 0,
  699. 'geometry': None,
  700. 'edge_attr_dim': 0,
  701. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8H.zip',
  702. 'domain': 'small molecules',
  703. },
  704. 'P388': {
  705. 'database': 'tudataset',
  706. 'reference': '[28]',
  707. 'dataset_size': 41472,
  708. 'class_number': 2,
  709. 'task_type': 'classification',
  710. 'ave_node_num': 22.11,
  711. 'ave_edge_num': 23.55,
  712. 'node_labeled': True,
  713. 'edge_labeled': True,
  714. 'node_attr_dim': 0,
  715. 'geometry': None,
  716. 'edge_attr_dim': 0,
  717. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388.zip',
  718. 'domain': 'small molecules',
  719. },
  720. 'P388H': {
  721. 'database': 'tudataset',
  722. 'reference': '[28]',
  723. 'dataset_size': 41472,
  724. 'class_number': 2,
  725. 'task_type': 'classification',
  726. 'ave_node_num': 40.44,
  727. 'ave_edge_num': 41.88,
  728. 'node_labeled': True,
  729. 'edge_labeled': True,
  730. 'node_attr_dim': 0,
  731. 'geometry': None,
  732. 'edge_attr_dim': 0,
  733. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388H.zip',
  734. 'domain': 'small molecules',
  735. },
  736. 'PC-3': {
  737. 'database': 'tudataset',
  738. 'reference': '[28]',
  739. 'dataset_size': 27509,
  740. 'class_number': 2,
  741. 'task_type': 'classification',
  742. 'ave_node_num': 26.35,
  743. 'ave_edge_num': 28.49,
  744. 'node_labeled': True,
  745. 'edge_labeled': True,
  746. 'node_attr_dim': 0,
  747. 'geometry': None,
  748. 'edge_attr_dim': 0,
  749. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3.zip',
  750. 'domain': 'small molecules',
  751. },
  752. 'PC-3H': {
  753. 'database': 'tudataset',
  754. 'reference': '[28]',
  755. 'dataset_size': 27509,
  756. 'class_number': 2,
  757. 'task_type': 'classification',
  758. 'ave_node_num': 47.19,
  759. 'ave_edge_num': 49.32,
  760. 'node_labeled': True,
  761. 'edge_labeled': True,
  762. 'node_attr_dim': 0,
  763. 'geometry': None,
  764. 'edge_attr_dim': 0,
  765. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3H.zip',
  766. 'domain': 'small molecules',
  767. },
  768. 'PTC_FM': {
  769. 'database': 'tudataset',
  770. 'reference': '[2,23]',
  771. 'dataset_size': 349,
  772. 'class_number': 2,
  773. 'task_type': 'classification',
  774. 'ave_node_num': 14.11,
  775. 'ave_edge_num': 14.48,
  776. 'node_labeled': True,
  777. 'edge_labeled': True,
  778. 'node_attr_dim': 0,
  779. 'geometry': None,
  780. 'edge_attr_dim': 0,
  781. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FM.zip',
  782. 'domain': 'small molecules',
  783. },
  784. 'PTC_FR': {
  785. 'database': 'tudataset',
  786. 'reference': '[2,23]',
  787. 'dataset_size': 351,
  788. 'class_number': 2,
  789. 'task_type': 'classification',
  790. 'ave_node_num': 14.56,
  791. 'ave_edge_num': 15.0,
  792. 'node_labeled': True,
  793. 'edge_labeled': True,
  794. 'node_attr_dim': 0,
  795. 'geometry': None,
  796. 'edge_attr_dim': 0,
  797. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FR.zip',
  798. 'domain': 'small molecules',
  799. },
  800. 'PTC_MM': {
  801. 'database': 'tudataset',
  802. 'reference': '[2,23]',
  803. 'dataset_size': 336,
  804. 'class_number': 2,
  805. 'task_type': 'classification',
  806. 'ave_node_num': 13.97,
  807. 'ave_edge_num': 14.32,
  808. 'node_labeled': True,
  809. 'edge_labeled': True,
  810. 'node_attr_dim': 0,
  811. 'geometry': None,
  812. 'edge_attr_dim': 0,
  813. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MM.zip',
  814. 'domain': 'small molecules',
  815. },
  816. 'PTC_MR': {
  817. 'database': 'tudataset',
  818. 'reference': '[2,23]',
  819. 'dataset_size': 344,
  820. 'class_number': 2,
  821. 'task_type': 'classification',
  822. 'ave_node_num': 14.29,
  823. 'ave_edge_num': 14.69,
  824. 'node_labeled': True,
  825. 'edge_labeled': True,
  826. 'node_attr_dim': 0,
  827. 'geometry': None,
  828. 'edge_attr_dim': 0,
  829. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MR.zip',
  830. 'domain': 'small molecules',
  831. },
  832. 'QM9': {
  833. 'database': 'tudataset',
  834. 'reference': '[33,34,35]',
  835. 'dataset_size': 129433,
  836. 'class_number': None,
  837. 'task_type': 'regression',
  838. 'ave_node_num': 18.03,
  839. 'ave_edge_num': 18.63,
  840. 'node_labeled': False,
  841. 'edge_labeled': False,
  842. 'node_attr_dim': 16,
  843. 'geometry': '3D, RI',
  844. 'edge_attr_dim': 4,
  845. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/QM9.zip',
  846. 'domain': 'small molecules',
  847. },
  848. 'salicylic_acid': {
  849. 'database': 'tudataset',
  850. 'reference': '[36]',
  851. 'dataset_size': 220232,
  852. 'class_number': None,
  853. 'task_type': 'regression',
  854. 'ave_node_num': 16.0,
  855. 'ave_edge_num': 104.13,
  856. 'node_labeled': True,
  857. 'edge_labeled': False,
  858. 'node_attr_dim': 6,
  859. 'geometry': '3D, RI',
  860. 'edge_attr_dim': 0,
  861. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/salicylic_acid.zip',
  862. 'domain': 'small molecules',
  863. },
  864. 'SF-295': {
  865. 'database': 'tudataset',
  866. 'reference': '[28]',
  867. 'dataset_size': 40271,
  868. 'class_number': 2,
  869. 'task_type': 'classification',
  870. 'ave_node_num': 26.06,
  871. 'ave_edge_num': 28.08,
  872. 'node_labeled': True,
  873. 'edge_labeled': True,
  874. 'node_attr_dim': 0,
  875. 'geometry': None,
  876. 'edge_attr_dim': 0,
  877. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295.zip',
  878. 'domain': 'small molecules',
  879. },
  880. 'SF-295H': {
  881. 'database': 'tudataset',
  882. 'reference': '[28]',
  883. 'dataset_size': 40271,
  884. 'class_number': 2,
  885. 'task_type': 'classification',
  886. 'ave_node_num': 46.65,
  887. 'ave_edge_num': 48.68,
  888. 'node_labeled': True,
  889. 'edge_labeled': True,
  890. 'node_attr_dim': 0,
  891. 'geometry': None,
  892. 'edge_attr_dim': 0,
  893. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295H.zip',
  894. 'domain': 'small molecules',
  895. },
  896. 'SN12C': {
  897. 'database': 'tudataset',
  898. 'reference': '[28]',
  899. 'dataset_size': 40004,
  900. 'class_number': 2,
  901. 'task_type': 'classification',
  902. 'ave_node_num': 26.08,
  903. 'ave_edge_num': 28.11,
  904. 'node_labeled': True,
  905. 'edge_labeled': True,
  906. 'node_attr_dim': 0,
  907. 'geometry': None,
  908. 'edge_attr_dim': 0,
  909. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12C.zip',
  910. 'domain': 'small molecules',
  911. },
  912. 'SN12CH': {
  913. 'database': 'tudataset',
  914. 'reference': '[28]',
  915. 'dataset_size': 40004,
  916. 'class_number': 2,
  917. 'task_type': 'classification',
  918. 'ave_node_num': 46.69,
  919. 'ave_edge_num': 48.71,
  920. 'node_labeled': True,
  921. 'edge_labeled': True,
  922. 'node_attr_dim': 0,
  923. 'geometry': None,
  924. 'edge_attr_dim': 0,
  925. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12CH.zip',
  926. 'domain': 'small molecules',
  927. },
  928. 'SW-620': {
  929. 'database': 'tudataset',
  930. 'reference': '[28]',
  931. 'dataset_size': 40532,
  932. 'class_number': 2,
  933. 'task_type': 'classification',
  934. 'ave_node_num': 26.05,
  935. 'ave_edge_num': 28.08,
  936. 'node_labeled': True,
  937. 'edge_labeled': True,
  938. 'node_attr_dim': 0,
  939. 'geometry': None,
  940. 'edge_attr_dim': 0,
  941. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620.zip',
  942. 'domain': 'small molecules',
  943. },
  944. 'SW-620H': {
  945. 'database': 'tudataset',
  946. 'reference': '[28]',
  947. 'dataset_size': 40532,
  948. 'class_number': 2,
  949. 'task_type': 'classification',
  950. 'ave_node_num': 46.62,
  951. 'ave_edge_num': 48.65,
  952. 'node_labeled': True,
  953. 'edge_labeled': True,
  954. 'node_attr_dim': 0,
  955. 'geometry': None,
  956. 'edge_attr_dim': 0,
  957. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620H.zip',
  958. 'domain': 'small molecules',
  959. },
  960. 'toluene': {
  961. 'database': 'tudataset',
  962. 'reference': '[36]',
  963. 'dataset_size': 342791,
  964. 'class_number': None,
  965. 'task_type': 'regression',
  966. 'ave_node_num': 15.0,
  967. 'ave_edge_num': 96.15,
  968. 'node_labeled': True,
  969. 'edge_labeled': False,
  970. 'node_attr_dim': 6,
  971. 'geometry': '3D, RI',
  972. 'edge_attr_dim': 0,
  973. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/toluene.zip',
  974. 'domain': 'small molecules',
  975. },
  976. 'Tox21_AhR_training': {
  977. 'database': 'tudataset',
  978. 'reference': '[24]',
  979. 'dataset_size': 8169,
  980. 'class_number': 2,
  981. 'task_type': 'classification',
  982. 'ave_node_num': 18.09,
  983. 'ave_edge_num': 18.5,
  984. 'node_labeled': True,
  985. 'edge_labeled': True,
  986. 'node_attr_dim': 0,
  987. 'geometry': None,
  988. 'edge_attr_dim': 0,
  989. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_training.zip',
  990. 'domain': 'small molecules',
  991. },
  992. 'Tox21_AhR_testing': {
  993. 'database': 'tudataset',
  994. 'reference': '[24]',
  995. 'dataset_size': 272,
  996. 'class_number': 2,
  997. 'task_type': 'classification',
  998. 'ave_node_num': 22.13,
  999. 'ave_edge_num': 23.05,
  1000. 'node_labeled': True,
  1001. 'edge_labeled': True,
  1002. 'node_attr_dim': 0,
  1003. 'geometry': None,
  1004. 'edge_attr_dim': 0,
  1005. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_testing.zip',
  1006. 'domain': 'small molecules',
  1007. },
  1008. 'Tox21_AhR_evaluation': {
  1009. 'database': 'tudataset',
  1010. 'reference': '[24]',
  1011. 'dataset_size': 607,
  1012. 'class_number': 2,
  1013. 'task_type': 'classification',
  1014. 'ave_node_num': 17.64,
  1015. 'ave_edge_num': 18.06,
  1016. 'node_labeled': True,
  1017. 'edge_labeled': True,
  1018. 'node_attr_dim': 0,
  1019. 'geometry': None,
  1020. 'edge_attr_dim': 0,
  1021. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_evaluation.zip',
  1022. 'domain': 'small molecules',
  1023. },
  1024. 'Tox21_AR_training': {
  1025. 'database': 'tudataset',
  1026. 'reference': '[24]',
  1027. 'dataset_size': 9362,
  1028. 'class_number': 2,
  1029. 'task_type': 'classification',
  1030. 'ave_node_num': 18.39,
  1031. 'ave_edge_num': 18.84,
  1032. 'node_labeled': True,
  1033. 'edge_labeled': True,
  1034. 'node_attr_dim': 0,
  1035. 'geometry': None,
  1036. 'edge_attr_dim': 0,
  1037. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_training.zip',
  1038. 'domain': 'small molecules',
  1039. },
  1040. 'Tox21_AR_testing': {
  1041. 'database': 'tudataset',
  1042. 'reference': '[24]',
  1043. 'dataset_size': 292,
  1044. 'class_number': 2,
  1045. 'task_type': 'classification',
  1046. 'ave_node_num': 22.35,
  1047. 'ave_edge_num': 23.32,
  1048. 'node_labeled': True,
  1049. 'edge_labeled': True,
  1050. 'node_attr_dim': 0,
  1051. 'geometry': None,
  1052. 'edge_attr_dim': 0,
  1053. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_testing.zip',
  1054. 'domain': 'small molecules',
  1055. },
  1056. 'Tox21_AR_evaluation': {
  1057. 'database': 'tudataset',
  1058. 'reference': '[24]',
  1059. 'dataset_size': 585,
  1060. 'class_number': 2,
  1061. 'task_type': 'classification',
  1062. 'ave_node_num': 17.99,
  1063. 'ave_edge_num': 18.45,
  1064. 'node_labeled': True,
  1065. 'edge_labeled': True,
  1066. 'node_attr_dim': 0,
  1067. 'geometry': None,
  1068. 'edge_attr_dim': 0,
  1069. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_evaluation.zip',
  1070. 'domain': 'small molecules',
  1071. },
  1072. 'Tox21_AR-LBD_training': {
  1073. 'database': 'tudataset',
  1074. 'reference': '[24]',
  1075. 'dataset_size': 8599,
  1076. 'class_number': 2,
  1077. 'task_type': 'classification',
  1078. 'ave_node_num': 17.77,
  1079. 'ave_edge_num': 18.16,
  1080. 'node_labeled': True,
  1081. 'edge_labeled': True,
  1082. 'node_attr_dim': 0,
  1083. 'geometry': None,
  1084. 'edge_attr_dim': 0,
  1085. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_training.zip',
  1086. 'domain': 'small molecules',
  1087. },
  1088. 'Tox21_AR-LBD_testing': {
  1089. 'database': 'tudataset',
  1090. 'reference': '[24]',
  1091. 'dataset_size': 253,
  1092. 'class_number': 2,
  1093. 'task_type': 'classification',
  1094. 'ave_node_num': 21.85,
  1095. 'ave_edge_num': 22.73,
  1096. 'node_labeled': True,
  1097. 'edge_labeled': True,
  1098. 'node_attr_dim': 0,
  1099. 'geometry': None,
  1100. 'edge_attr_dim': 0,
  1101. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_testing.zip',
  1102. 'domain': 'small molecules',
  1103. },
  1104. 'Tox21_AR-LBD_evaluation': {
  1105. 'database': 'tudataset',
  1106. 'reference': '[24]',
  1107. 'dataset_size': 580,
  1108. 'class_number': 2,
  1109. 'task_type': 'classification',
  1110. 'ave_node_num': 17.09,
  1111. 'ave_edge_num': 17.42,
  1112. 'node_labeled': True,
  1113. 'edge_labeled': True,
  1114. 'node_attr_dim': 0,
  1115. 'geometry': None,
  1116. 'edge_attr_dim': 0,
  1117. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_evaluation.zip',
  1118. 'domain': 'small molecules',
  1119. },
  1120. 'Tox21_ARE_training': {
  1121. 'database': 'tudataset',
  1122. 'reference': '[24]',
  1123. 'dataset_size': 7167,
  1124. 'class_number': 2,
  1125. 'task_type': 'classification',
  1126. 'ave_node_num': 16.28,
  1127. 'ave_edge_num': 16.52,
  1128. 'node_labeled': True,
  1129. 'edge_labeled': True,
  1130. 'node_attr_dim': 0,
  1131. 'geometry': None,
  1132. 'edge_attr_dim': 0,
  1133. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_training.zip',
  1134. 'domain': 'small molecules',
  1135. },
  1136. 'Tox21_ARE_testing': {
  1137. 'database': 'tudataset',
  1138. 'reference': '[24]',
  1139. 'dataset_size': 234,
  1140. 'class_number': 2,
  1141. 'task_type': 'classification',
  1142. 'ave_node_num': 21.99,
  1143. 'ave_edge_num': 22.91,
  1144. 'node_labeled': True,
  1145. 'edge_labeled': True,
  1146. 'node_attr_dim': 0,
  1147. 'geometry': None,
  1148. 'edge_attr_dim': 0,
  1149. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_testing.zip',
  1150. 'domain': 'small molecules',
  1151. },
  1152. 'Tox21_ARE_evaluation': {
  1153. 'database': 'tudataset',
  1154. 'reference': '[24]',
  1155. 'dataset_size': 552,
  1156. 'class_number': 2,
  1157. 'task_type': 'classification',
  1158. 'ave_node_num': 17.01,
  1159. 'ave_edge_num': 17.33,
  1160. 'node_labeled': True,
  1161. 'edge_labeled': True,
  1162. 'node_attr_dim': 0,
  1163. 'geometry': None,
  1164. 'edge_attr_dim': 0,
  1165. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_evaluation.zip',
  1166. 'domain': 'small molecules',
  1167. },
  1168. 'Tox21_aromatase_training': {
  1169. 'database': 'tudataset',
  1170. 'reference': '[24]',
  1171. 'dataset_size': 7226,
  1172. 'class_number': 2,
  1173. 'task_type': 'classification',
  1174. 'ave_node_num': 17.5,
  1175. 'ave_edge_num': 17.79,
  1176. 'node_labeled': True,
  1177. 'edge_labeled': True,
  1178. 'node_attr_dim': 0,
  1179. 'geometry': None,
  1180. 'edge_attr_dim': 0,
  1181. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_training.zip',
  1182. 'domain': 'small molecules',
  1183. },
  1184. 'Tox21_aromatase_testing': {
  1185. 'database': 'tudataset',
  1186. 'reference': '[24]',
  1187. 'dataset_size': 214,
  1188. 'class_number': 2,
  1189. 'task_type': 'classification',
  1190. 'ave_node_num': 21.65,
  1191. 'ave_edge_num': 22.36,
  1192. 'node_labeled': True,
  1193. 'edge_labeled': True,
  1194. 'node_attr_dim': 0,
  1195. 'geometry': None,
  1196. 'edge_attr_dim': 0,
  1197. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_testing.zip',
  1198. 'domain': 'small molecules',
  1199. },
  1200. 'Tox21_aromatase_evaluation': {
  1201. 'database': 'tudataset',
  1202. 'reference': '[24]',
  1203. 'dataset_size': 528,
  1204. 'class_number': 2,
  1205. 'task_type': 'classification',
  1206. 'ave_node_num': 16.74,
  1207. 'ave_edge_num': 16.99,
  1208. 'node_labeled': True,
  1209. 'edge_labeled': True,
  1210. 'node_attr_dim': 0,
  1211. 'geometry': None,
  1212. 'edge_attr_dim': 0,
  1213. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_evaluation.zip',
  1214. 'domain': 'small molecules',
  1215. },
  1216. 'Tox21_ATAD5_training': {
  1217. 'database': 'tudataset',
  1218. 'reference': '[24]',
  1219. 'dataset_size': 9091,
  1220. 'class_number': 2,
  1221. 'task_type': 'classification',
  1222. 'ave_node_num': 17.89,
  1223. 'ave_edge_num': 18.3,
  1224. 'node_labeled': True,
  1225. 'edge_labeled': True,
  1226. 'node_attr_dim': 0,
  1227. 'geometry': None,
  1228. 'edge_attr_dim': 0,
  1229. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_training.zip',
  1230. 'domain': 'small molecules',
  1231. },
  1232. 'Tox21_ATAD5_testing': {
  1233. 'database': 'tudataset',
  1234. 'reference': '[24]',
  1235. 'dataset_size': 272,
  1236. 'class_number': 2,
  1237. 'task_type': 'classification',
  1238. 'ave_node_num': 21.99,
  1239. 'ave_edge_num': 22.89,
  1240. 'node_labeled': True,
  1241. 'edge_labeled': True,
  1242. 'node_attr_dim': 0,
  1243. 'geometry': None,
  1244. 'edge_attr_dim': 0,
  1245. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_testing.zip',
  1246. 'domain': 'small molecules',
  1247. },
  1248. 'Tox21_ATAD5_evaluation': {
  1249. 'database': 'tudataset',
  1250. 'reference': '[24]',
  1251. 'dataset_size': 619,
  1252. 'class_number': 2,
  1253. 'task_type': 'classification',
  1254. 'ave_node_num': 17.68,
  1255. 'ave_edge_num': 18.11,
  1256. 'node_labeled': True,
  1257. 'edge_labeled': True,
  1258. 'node_attr_dim': 0,
  1259. 'geometry': None,
  1260. 'edge_attr_dim': 0,
  1261. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_evaluation.zip',
  1262. 'domain': 'small molecules',
  1263. },
  1264. 'Tox21_ER_training': {
  1265. 'database': 'tudataset',
  1266. 'reference': '[24]',
  1267. 'dataset_size': 7697,
  1268. 'class_number': 2,
  1269. 'task_type': 'classification',
  1270. 'ave_node_num': 17.58,
  1271. 'ave_edge_num': 17.94,
  1272. 'node_labeled': True,
  1273. 'edge_labeled': True,
  1274. 'node_attr_dim': 0,
  1275. 'geometry': None,
  1276. 'edge_attr_dim': 0,
  1277. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_training.zip',
  1278. 'domain': 'small molecules',
  1279. },
  1280. 'Tox21_ER_testing': {
  1281. 'database': 'tudataset',
  1282. 'reference': '[24]',
  1283. 'dataset_size': 265,
  1284. 'class_number': 2,
  1285. 'task_type': 'classification',
  1286. 'ave_node_num': 22.16,
  1287. 'ave_edge_num': 23.13,
  1288. 'node_labeled': True,
  1289. 'edge_labeled': True,
  1290. 'node_attr_dim': 0,
  1291. 'geometry': None,
  1292. 'edge_attr_dim': 0,
  1293. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_testing.zip',
  1294. 'domain': 'small molecules',
  1295. },
  1296. 'Tox21_ER_evaluation': {
  1297. 'database': 'tudataset',
  1298. 'reference': '[24]',
  1299. 'dataset_size': 515,
  1300. 'class_number': 2,
  1301. 'task_type': 'classification',
  1302. 'ave_node_num': 17.66,
  1303. 'ave_edge_num': 18.1,
  1304. 'node_labeled': True,
  1305. 'edge_labeled': True,
  1306. 'node_attr_dim': 0,
  1307. 'geometry': None,
  1308. 'edge_attr_dim': 0,
  1309. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_evaluation.zip',
  1310. 'domain': 'small molecules',
  1311. },
  1312. 'Tox21_ER-LBD_training': {
  1313. 'database': 'tudataset',
  1314. 'reference': '[24]',
  1315. 'dataset_size': 8753,
  1316. 'class_number': 2,
  1317. 'task_type': 'classification',
  1318. 'ave_node_num': 18.06,
  1319. 'ave_edge_num': 18.47,
  1320. 'node_labeled': True,
  1321. 'edge_labeled': True,
  1322. 'node_attr_dim': 0,
  1323. 'geometry': None,
  1324. 'edge_attr_dim': 0,
  1325. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_training.zip',
  1326. 'domain': 'small molecules',
  1327. },
  1328. 'Tox21_ER-LBD_testing': {
  1329. 'database': 'tudataset',
  1330. 'reference': '[24]',
  1331. 'dataset_size': 287,
  1332. 'class_number': 2,
  1333. 'task_type': 'classification',
  1334. 'ave_node_num': 22.28,
  1335. 'ave_edge_num': 23.23,
  1336. 'node_labeled': True,
  1337. 'edge_labeled': True,
  1338. 'node_attr_dim': 0,
  1339. 'geometry': None,
  1340. 'edge_attr_dim': 0,
  1341. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_testing.zip',
  1342. 'domain': 'small molecules',
  1343. },
  1344. 'Tox21_ER-LBD_evaluation': {
  1345. 'database': 'tudataset',
  1346. 'reference': '[24]',
  1347. 'dataset_size': 599,
  1348. 'class_number': 2,
  1349. 'task_type': 'classification',
  1350. 'ave_node_num': 17.75,
  1351. 'ave_edge_num': 18.17,
  1352. 'node_labeled': True,
  1353. 'edge_labeled': True,
  1354. 'node_attr_dim': 0,
  1355. 'geometry': None,
  1356. 'edge_attr_dim': 0,
  1357. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_evaluation.zip',
  1358. 'domain': 'small molecules',
  1359. },
  1360. 'Tox21_HSE_training': {
  1361. 'database': 'tudataset',
  1362. 'reference': '[24]',
  1363. 'dataset_size': 8150,
  1364. 'class_number': 2,
  1365. 'task_type': 'classification',
  1366. 'ave_node_num': 16.72,
  1367. 'ave_edge_num': 17.04,
  1368. 'node_labeled': True,
  1369. 'edge_labeled': True,
  1370. 'node_attr_dim': 0,
  1371. 'geometry': None,
  1372. 'edge_attr_dim': 0,
  1373. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_training.zip',
  1374. 'domain': 'small molecules',
  1375. },
  1376. 'Tox21_HSE_testing': {
  1377. 'database': 'tudataset',
  1378. 'reference': '[24]',
  1379. 'dataset_size': 267,
  1380. 'class_number': 2,
  1381. 'task_type': 'classification',
  1382. 'ave_node_num': 22.07,
  1383. 'ave_edge_num': 23.0,
  1384. 'node_labeled': True,
  1385. 'edge_labeled': True,
  1386. 'node_attr_dim': 0,
  1387. 'geometry': None,
  1388. 'edge_attr_dim': 0,
  1389. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_testing.zip',
  1390. 'domain': 'small molecules',
  1391. },
  1392. 'Tox21_HSE_evaluation': {
  1393. 'database': 'tudataset',
  1394. 'reference': '[24]',
  1395. 'dataset_size': 607,
  1396. 'class_number': 2,
  1397. 'task_type': 'classification',
  1398. 'ave_node_num': 17.61,
  1399. 'ave_edge_num': 18.01,
  1400. 'node_labeled': True,
  1401. 'edge_labeled': True,
  1402. 'node_attr_dim': 0,
  1403. 'geometry': None,
  1404. 'edge_attr_dim': 0,
  1405. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_evaluation.zip',
  1406. 'domain': 'small molecules',
  1407. },
  1408. 'Tox21_MMP_training': {
  1409. 'database': 'tudataset',
  1410. 'reference': '[24]',
  1411. 'dataset_size': 7320,
  1412. 'class_number': 2,
  1413. 'task_type': 'classification',
  1414. 'ave_node_num': 17.49,
  1415. 'ave_edge_num': 17.83,
  1416. 'node_labeled': True,
  1417. 'edge_labeled': True,
  1418. 'node_attr_dim': 0,
  1419. 'geometry': None,
  1420. 'edge_attr_dim': 0,
  1421. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_training.zip',
  1422. 'domain': 'small molecules',
  1423. },
  1424. 'Tox21_MMP_testing': {
  1425. 'database': 'tudataset',
  1426. 'reference': '[24]',
  1427. 'dataset_size': 238,
  1428. 'class_number': 2,
  1429. 'task_type': 'classification',
  1430. 'ave_node_num': 21.68,
  1431. 'ave_edge_num': 22.55,
  1432. 'node_labeled': True,
  1433. 'edge_labeled': True,
  1434. 'node_attr_dim': 0,
  1435. 'geometry': None,
  1436. 'edge_attr_dim': 0,
  1437. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_testing.zip',
  1438. 'domain': 'small molecules',
  1439. },
  1440. 'Tox21_MMP_evaluation': {
  1441. 'database': 'tudataset',
  1442. 'reference': '[24]',
  1443. 'dataset_size': 541,
  1444. 'class_number': 2,
  1445. 'task_type': 'classification',
  1446. 'ave_node_num': 16.67,
  1447. 'ave_edge_num': 16.88,
  1448. 'node_labeled': True,
  1449. 'edge_labeled': True,
  1450. 'node_attr_dim': 0,
  1451. 'geometry': None,
  1452. 'edge_attr_dim': 0,
  1453. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_evaluation.zip',
  1454. 'domain': 'small molecules',
  1455. },
  1456. 'Tox21_p53_training': {
  1457. 'database': 'tudataset',
  1458. 'reference': '[24]',
  1459. 'dataset_size': 8634,
  1460. 'class_number': 2,
  1461. 'task_type': 'classification',
  1462. 'ave_node_num': 17.79,
  1463. 'ave_edge_num': 18.19,
  1464. 'node_labeled': True,
  1465. 'edge_labeled': True,
  1466. 'node_attr_dim': 0,
  1467. 'geometry': None,
  1468. 'edge_attr_dim': 0,
  1469. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_training.zip',
  1470. 'domain': 'small molecules',
  1471. },
  1472. 'Tox21_p53_testing': {
  1473. 'database': 'tudataset',
  1474. 'reference': '[24]',
  1475. 'dataset_size': 269,
  1476. 'class_number': 2,
  1477. 'task_type': 'classification',
  1478. 'ave_node_num': 22.14,
  1479. 'ave_edge_num': 23.04,
  1480. 'node_labeled': True,
  1481. 'edge_labeled': True,
  1482. 'node_attr_dim': 0,
  1483. 'geometry': None,
  1484. 'edge_attr_dim': 0,
  1485. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_testing.zip',
  1486. 'domain': 'small molecules',
  1487. },
  1488. 'Tox21_p53_evaluation': {
  1489. 'database': 'tudataset',
  1490. 'reference': '[24]',
  1491. 'dataset_size': 613,
  1492. 'class_number': 2,
  1493. 'task_type': 'classification',
  1494. 'ave_node_num': 17.34,
  1495. 'ave_edge_num': 17.72,
  1496. 'node_labeled': True,
  1497. 'edge_labeled': True,
  1498. 'node_attr_dim': 0,
  1499. 'geometry': None,
  1500. 'edge_attr_dim': 0,
  1501. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_evaluation.zip',
  1502. 'domain': 'small molecules',
  1503. },
  1504. 'Tox21_PPAR-gamma_training': {
  1505. 'database': 'tudataset',
  1506. 'reference': '[24]',
  1507. 'dataset_size': 8184,
  1508. 'class_number': 2,
  1509. 'task_type': 'classification',
  1510. 'ave_node_num': 17.23,
  1511. 'ave_edge_num': 17.55,
  1512. 'node_labeled': True,
  1513. 'edge_labeled': True,
  1514. 'node_attr_dim': 0,
  1515. 'geometry': None,
  1516. 'edge_attr_dim': 0,
  1517. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_training.zip',
  1518. 'domain': 'small molecules',
  1519. },
  1520. 'Tox21_PPAR-gamma_testing': {
  1521. 'database': 'tudataset',
  1522. 'reference': '[24]',
  1523. 'dataset_size': 267,
  1524. 'class_number': 2,
  1525. 'task_type': 'classification',
  1526. 'ave_node_num': 22.04,
  1527. 'ave_edge_num': 22.93,
  1528. 'node_labeled': True,
  1529. 'edge_labeled': True,
  1530. 'node_attr_dim': 0,
  1531. 'geometry': None,
  1532. 'edge_attr_dim': 0,
  1533. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_testing.zip',
  1534. 'domain': 'small molecules',
  1535. },
  1536. 'Tox21_PPAR-gamma_evaluation': {
  1537. 'database': 'tudataset',
  1538. 'reference': '[24]',
  1539. 'dataset_size': 602,
  1540. 'class_number': 2,
  1541. 'task_type': 'classification',
  1542. 'ave_node_num': 17.38,
  1543. 'ave_edge_num': 17.77,
  1544. 'node_labeled': True,
  1545. 'edge_labeled': True,
  1546. 'node_attr_dim': 0,
  1547. 'geometry': None,
  1548. 'edge_attr_dim': 0,
  1549. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_evaluation.zip',
  1550. 'domain': 'small molecules',
  1551. },
  1552. 'UACC257': {
  1553. 'database': 'tudataset',
  1554. 'reference': '[28]',
  1555. 'dataset_size': 39988,
  1556. 'class_number': 2,
  1557. 'task_type': 'classification',
  1558. 'ave_node_num': 26.09,
  1559. 'ave_edge_num': 28.12,
  1560. 'node_labeled': True,
  1561. 'edge_labeled': True,
  1562. 'node_attr_dim': 0,
  1563. 'geometry': None,
  1564. 'edge_attr_dim': 0,
  1565. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257.zip',
  1566. 'domain': 'small molecules',
  1567. },
  1568. 'UACC257H': {
  1569. 'database': 'tudataset',
  1570. 'reference': '[28]',
  1571. 'dataset_size': 39988,
  1572. 'class_number': 2,
  1573. 'task_type': 'classification',
  1574. 'ave_node_num': 46.68,
  1575. 'ave_edge_num': 48.71,
  1576. 'node_labeled': True,
  1577. 'edge_labeled': True,
  1578. 'node_attr_dim': 0,
  1579. 'geometry': None,
  1580. 'edge_attr_dim': 0,
  1581. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257H.zip',
  1582. 'domain': 'small molecules',
  1583. },
  1584. 'uracil': {
  1585. 'database': 'tudataset',
  1586. 'reference': '[36]',
  1587. 'dataset_size': 133770,
  1588. 'class_number': None,
  1589. 'task_type': 'regression',
  1590. 'ave_node_num': 12.0,
  1591. 'ave_edge_num': 64.44,
  1592. 'node_labeled': True,
  1593. 'edge_labeled': False,
  1594. 'node_attr_dim': 6,
  1595. 'geometry': '3D, RI',
  1596. 'edge_attr_dim': 0,
  1597. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/uracil.zip',
  1598. 'domain': 'small molecules',
  1599. },
  1600. 'Yeast': {
  1601. 'database': 'tudataset',
  1602. 'reference': '[28]',
  1603. 'dataset_size': 79601,
  1604. 'class_number': 2,
  1605. 'task_type': 'classification',
  1606. 'ave_node_num': 21.54,
  1607. 'ave_edge_num': 22.84,
  1608. 'node_labeled': True,
  1609. 'edge_labeled': True,
  1610. 'node_attr_dim': 0,
  1611. 'geometry': None,
  1612. 'edge_attr_dim': 0,
  1613. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Yeast.zip',
  1614. 'domain': 'small molecules',
  1615. },
  1616. 'YeastH': {
  1617. 'database': 'tudataset',
  1618. 'reference': '[28]',
  1619. 'dataset_size': 79601,
  1620. 'class_number': 2,
  1621. 'task_type': 'classification',
  1622. 'ave_node_num': 39.44,
  1623. 'ave_edge_num': 40.74,
  1624. 'node_labeled': True,
  1625. 'edge_labeled': True,
  1626. 'node_attr_dim': 0,
  1627. 'geometry': None,
  1628. 'edge_attr_dim': 0,
  1629. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/YeastH.zip',
  1630. 'domain': 'small molecules',
  1631. },
  1632. 'ZINC_full': {
  1633. 'database': 'tudataset',
  1634. 'reference': '[31]',
  1635. 'dataset_size': 249456,
  1636. 'class_number': None,
  1637. 'task_type': 'regression',
  1638. 'ave_node_num': 23.14,
  1639. 'ave_edge_num': 24.91,
  1640. 'node_labeled': True,
  1641. 'edge_labeled': True,
  1642. 'node_attr_dim': 0,
  1643. 'geometry': None,
  1644. 'edge_attr_dim': 0,
  1645. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_full.zip',
  1646. 'domain': 'small molecules',
  1647. },
  1648. 'ZINC_test': {
  1649. 'database': 'tudataset',
  1650. 'reference': '[31]',
  1651. 'dataset_size': 5000,
  1652. 'class_number': None,
  1653. 'task_type': 'regression',
  1654. 'ave_node_num': 23.1,
  1655. 'ave_edge_num': 24.83,
  1656. 'node_labeled': True,
  1657. 'edge_labeled': True,
  1658. 'node_attr_dim': 0,
  1659. 'geometry': None,
  1660. 'edge_attr_dim': 0,
  1661. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_test.zip',
  1662. 'domain': 'small molecules',
  1663. },
  1664. 'ZINC_train': {
  1665. 'database': 'tudataset',
  1666. 'reference': '[31]',
  1667. 'dataset_size': 220011,
  1668. 'class_number': None,
  1669. 'task_type': 'regression',
  1670. 'ave_node_num': 23.15,
  1671. 'ave_edge_num': 24.91,
  1672. 'node_labeled': True,
  1673. 'edge_labeled': True,
  1674. 'node_attr_dim': 0,
  1675. 'geometry': None,
  1676. 'edge_attr_dim': 0,
  1677. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_train.zip',
  1678. 'domain': 'small molecules',
  1679. },
  1680. 'ZINC_val': {
  1681. 'database': 'tudataset',
  1682. 'reference': '[31]',
  1683. 'dataset_size': 24445,
  1684. 'class_number': None,
  1685. 'task_type': 'regression',
  1686. 'ave_node_num': 23.13,
  1687. 'ave_edge_num': 24.88,
  1688. 'node_labeled': True,
  1689. 'edge_labeled': True,
  1690. 'node_attr_dim': 0,
  1691. 'geometry': None,
  1692. 'edge_attr_dim': 0,
  1693. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_val.zip',
  1694. 'domain': 'small molecules',
  1695. },
  1696. ### bioinformatics
  1697. 'DD': {
  1698. 'database': 'tudataset',
  1699. 'reference': '[6,22]',
  1700. 'dataset_size': 1178,
  1701. 'class_number': 2,
  1702. 'task_type': 'classification',
  1703. 'ave_node_num': 284.32,
  1704. 'ave_edge_num': 715.66,
  1705. 'node_labeled': True,
  1706. 'edge_labeled': False,
  1707. 'node_attr_dim': 0,
  1708. 'geometry': None,
  1709. 'edge_attr_dim': 0,
  1710. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DD.zip',
  1711. 'domain': 'bioinformatics',
  1712. },
  1713. 'ENZYMES': {
  1714. 'database': 'tudataset',
  1715. 'reference': '[4,5]',
  1716. 'dataset_size': 600,
  1717. 'class_number': 6,
  1718. 'task_type': 'classification',
  1719. 'ave_node_num': 32.63,
  1720. 'ave_edge_num': 62.14,
  1721. 'node_labeled': True,
  1722. 'edge_labeled': False,
  1723. 'node_attr_dim': 18,
  1724. 'geometry': None,
  1725. 'edge_attr_dim': 0,
  1726. 'url': 'http://www.chrsmrrs.com/graphkerneldatasets/ENZYMES.zip',
  1727. 'domain': 'bioinformatics',
  1728. },
  1729. 'KKI': {
  1730. 'database': 'tudataset',
  1731. 'reference': '[26]',
  1732. 'dataset_size': 83,
  1733. 'class_number': 2,
  1734. 'task_type': 'classification',
  1735. 'ave_node_num': 26.96,
  1736. 'ave_edge_num': 48.42,
  1737. 'node_labeled': True,
  1738. 'edge_labeled': False,
  1739. 'node_attr_dim': 0,
  1740. 'geometry': None,
  1741. 'edge_attr_dim': 0,
  1742. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/KKI.zip',
  1743. 'domain': 'bioinformatics',
  1744. },
  1745. 'OHSU': {
  1746. 'database': 'tudataset',
  1747. 'reference': '[26]',
  1748. 'dataset_size': 79,
  1749. 'class_number': 2,
  1750. 'task_type': 'classification',
  1751. 'ave_node_num': 82.01,
  1752. 'ave_edge_num': 199.66,
  1753. 'node_labeled': True,
  1754. 'edge_labeled': False,
  1755. 'node_attr_dim': 0,
  1756. 'geometry': None,
  1757. 'edge_attr_dim': 0,
  1758. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OHSU.zip',
  1759. 'domain': 'bioinformatics',
  1760. },
  1761. 'Peking_1': {
  1762. 'database': 'tudataset',
  1763. 'reference': '[26]',
  1764. 'dataset_size': 85,
  1765. 'class_number': 2,
  1766. 'task_type': 'classification',
  1767. 'ave_node_num': 39.31,
  1768. 'ave_edge_num': 77.35,
  1769. 'node_labeled': True,
  1770. 'edge_labeled': False,
  1771. 'node_attr_dim': 0,
  1772. 'geometry': None,
  1773. 'edge_attr_dim': 0,
  1774. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Peking_1.zip',
  1775. 'domain': 'bioinformatics',
  1776. },
  1777. 'PROTEINS': {
  1778. 'database': 'tudataset',
  1779. 'reference': '[4,6]',
  1780. 'dataset_size': 1113,
  1781. 'class_number': 2,
  1782. 'task_type': 'classification',
  1783. 'ave_node_num': 39.06,
  1784. 'ave_edge_num': 72.82,
  1785. 'node_labeled': True,
  1786. 'edge_labeled': False,
  1787. 'node_attr_dim': 1,
  1788. 'geometry': None,
  1789. 'edge_attr_dim': 0,
  1790. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS.zip',
  1791. 'domain': 'bioinformatics',
  1792. },
  1793. 'PROTEINS_full': {
  1794. 'database': 'tudataset',
  1795. 'reference': '[4,6]',
  1796. 'dataset_size': 1113,
  1797. 'class_number': 2,
  1798. 'task_type': 'classification',
  1799. 'ave_node_num': 39.06,
  1800. 'ave_edge_num': 72.82,
  1801. 'node_labeled': True,
  1802. 'edge_labeled': False,
  1803. 'node_attr_dim': 29,
  1804. 'geometry': None,
  1805. 'edge_attr_dim': 0,
  1806. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS_full.zip',
  1807. 'domain': 'bioinformatics',
  1808. },
  1809. ### computer vision
  1810. 'COIL-DEL': {
  1811. 'database': 'tudataset',
  1812. 'reference': '[16,18]',
  1813. 'dataset_size': 3900,
  1814. 'class_number': 100,
  1815. 'task_type': 'classification',
  1816. 'ave_node_num': 21.54,
  1817. 'ave_edge_num': 54.24,
  1818. 'node_labeled': False,
  1819. 'edge_labeled': True,
  1820. 'node_attr_dim': 2,
  1821. 'geometry': None,
  1822. 'edge_attr_dim': 0,
  1823. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-DEL.zip',
  1824. 'domain': 'computer vision',
  1825. },
  1826. 'COIL-RAG': {
  1827. 'database': 'tudataset',
  1828. 'reference': '[16,18]',
  1829. 'dataset_size': 3900,
  1830. 'class_number': 100,
  1831. 'task_type': 'classification',
  1832. 'ave_node_num': 3.01,
  1833. 'ave_edge_num': 3.02,
  1834. 'node_labeled': False,
  1835. 'edge_labeled': False,
  1836. 'node_attr_dim': 64,
  1837. 'geometry': None,
  1838. 'edge_attr_dim': 1,
  1839. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-RAG.zip',
  1840. 'domain': 'computer vision',
  1841. },
  1842. 'Cuneiform': {
  1843. 'database': 'tudataset',
  1844. 'reference': '[25]',
  1845. 'dataset_size': 267,
  1846. 'class_number': 30,
  1847. 'task_type': 'classification',
  1848. 'ave_node_num': 21.27,
  1849. 'ave_edge_num': 44.8,
  1850. 'node_labeled': True,
  1851. 'edge_labeled': True,
  1852. 'node_attr_dim': 3,
  1853. 'geometry': '3D',
  1854. 'edge_attr_dim': 2,
  1855. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Cuneiform.zip',
  1856. 'domain': 'computer vision',
  1857. },
  1858. 'Fingerprint': {
  1859. 'database': 'tudataset',
  1860. 'reference': '[16,19]',
  1861. 'dataset_size': 2800,
  1862. 'class_number': 4,
  1863. 'task_type': 'classification',
  1864. 'ave_node_num': 5.42,
  1865. 'ave_edge_num': 4.42,
  1866. 'node_labeled': False,
  1867. 'edge_labeled': False,
  1868. 'node_attr_dim': 2,
  1869. 'geometry': '2D',
  1870. 'edge_attr_dim': 2,
  1871. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Fingerprint.zip',
  1872. 'domain': 'computer vision',
  1873. },
  1874. 'FIRSTMM_DB': {
  1875. 'database': 'tudataset',
  1876. 'reference': '[11,12,13]',
  1877. 'dataset_size': 41,
  1878. 'class_number': 11,
  1879. 'task_type': 'classification',
  1880. 'ave_node_num': 1377.27,
  1881. 'ave_edge_num': 3074.1,
  1882. 'node_labeled': True,
  1883. 'edge_labeled': False,
  1884. 'node_attr_dim': 1,
  1885. 'geometry': None,
  1886. 'edge_attr_dim': 2,
  1887. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FIRSTMM_DB.zip',
  1888. 'domain': 'computer vision',
  1889. },
  1890. 'Letter-high': {
  1891. 'database': 'tudataset',
  1892. 'reference': '[16]',
  1893. 'dataset_size': 2250,
  1894. 'class_number': 15,
  1895. 'task_type': 'classification',
  1896. 'ave_node_num': 4.67,
  1897. 'ave_edge_num': 4.5,
  1898. 'node_labeled': False,
  1899. 'edge_labeled': False,
  1900. 'node_attr_dim': 2,
  1901. 'geometry': '2D',
  1902. 'edge_attr_dim': 0,
  1903. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-high.zip',
  1904. 'domain': 'computer vision',
  1905. },
  1906. 'Letter-low': {
  1907. 'database': 'tudataset',
  1908. 'reference': '[16]',
  1909. 'dataset_size': 2250,
  1910. 'class_number': 15,
  1911. 'task_type': 'classification',
  1912. 'ave_node_num': 4.68,
  1913. 'ave_edge_num': 3.13,
  1914. 'node_labeled': False,
  1915. 'edge_labeled': False,
  1916. 'node_attr_dim': 2,
  1917. 'geometry': '2D',
  1918. 'edge_attr_dim': 0,
  1919. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-low.zip',
  1920. 'domain': 'computer vision',
  1921. },
  1922. 'Letter-med': {
  1923. 'database': 'tudataset',
  1924. 'reference': '[16]',
  1925. 'dataset_size': 2250,
  1926. 'class_number': 15,
  1927. 'task_type': 'classification',
  1928. 'ave_node_num': 4.67,
  1929. 'ave_edge_num': 4.5,
  1930. 'node_labeled': False,
  1931. 'edge_labeled': False,
  1932. 'node_attr_dim': 2,
  1933. 'geometry': '2D',
  1934. 'edge_attr_dim': 0,
  1935. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-med.zip',
  1936. 'domain': 'computer vision',
  1937. },
  1938. 'MSRC_9': {
  1939. 'database': 'tudataset',
  1940. 'reference': '[13]',
  1941. 'dataset_size': 221,
  1942. 'class_number': 8,
  1943. 'task_type': 'classification',
  1944. 'ave_node_num': 40.58,
  1945. 'ave_edge_num': 97.94,
  1946. 'node_labeled': True,
  1947. 'edge_labeled': False,
  1948. 'node_attr_dim': 0,
  1949. 'geometry': None,
  1950. 'edge_attr_dim': 0,
  1951. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_9.zip',
  1952. 'domain': 'computer vision',
  1953. },
  1954. 'MSRC_21': {
  1955. 'database': 'tudataset',
  1956. 'reference': '[13]',
  1957. 'dataset_size': 563,
  1958. 'class_number': 20,
  1959. 'task_type': 'classification',
  1960. 'ave_node_num': 77.52,
  1961. 'ave_edge_num': 198.32,
  1962. 'node_labeled': True,
  1963. 'edge_labeled': False,
  1964. 'node_attr_dim': 0,
  1965. 'geometry': None,
  1966. 'edge_attr_dim': 0,
  1967. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21.zip',
  1968. 'domain': 'computer vision',
  1969. },
  1970. 'MSRC_21C': {
  1971. 'database': 'tudataset',
  1972. 'reference': '[13]',
  1973. 'dataset_size': 209,
  1974. 'class_number': 20,
  1975. 'task_type': 'classification',
  1976. 'ave_node_num': 40.28,
  1977. 'ave_edge_num': 96.6,
  1978. 'node_labeled': True,
  1979. 'edge_labeled': False,
  1980. 'node_attr_dim': 0,
  1981. 'geometry': None,
  1982. 'edge_attr_dim': 0,
  1983. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21C.zip',
  1984. 'domain': 'computer vision',
  1985. },
  1986. ### social networks
  1987. 'COLLAB': {
  1988. 'database': 'tudataset',
  1989. 'reference': '[14]',
  1990. 'dataset_size': 5000,
  1991. 'class_number': 3,
  1992. 'task_type': 'classification',
  1993. 'ave_node_num': 74.49,
  1994. 'ave_edge_num': 2457.78,
  1995. 'node_labeled': False,
  1996. 'edge_labeled': False,
  1997. 'node_attr_dim': 0,
  1998. 'geometry': None,
  1999. 'edge_attr_dim': 0,
  2000. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLLAB.zip',
  2001. 'domain': 'social networks',
  2002. },
  2003. 'dblp_ct1': {
  2004. 'database': 'tudataset',
  2005. 'reference': '[32]',
  2006. 'dataset_size': 755,
  2007. 'class_number': 2,
  2008. 'task_type': 'classification',
  2009. 'ave_node_num': 52.87,
  2010. 'ave_edge_num': 320.09,
  2011. 'node_labeled': False,
  2012. 'edge_labeled': False,
  2013. 'node_attr_dim': 0,
  2014. 'geometry': None,
  2015. 'edge_attr_dim': 'temporal',
  2016. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct1.zip',
  2017. 'domain': 'social networks',
  2018. },
  2019. 'dblp_ct2': {
  2020. 'database': 'tudataset',
  2021. 'reference': '[32]',
  2022. 'dataset_size': 755,
  2023. 'class_number': 2,
  2024. 'task_type': 'classification',
  2025. 'ave_node_num': 52.87,
  2026. 'ave_edge_num': 320.09,
  2027. 'node_labeled': False,
  2028. 'edge_labeled': False,
  2029. 'node_attr_dim': 0,
  2030. 'geometry': None,
  2031. 'edge_attr_dim': 'temporal',
  2032. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct2.zip',
  2033. 'domain': 'social networks',
  2034. },
  2035. 'DBLP_v1': {
  2036. 'database': 'tudataset',
  2037. 'reference': '[26]',
  2038. 'dataset_size': 19456,
  2039. 'class_number': 2,
  2040. 'task_type': 'classification',
  2041. 'ave_node_num': 10.48,
  2042. 'ave_edge_num': 19.65,
  2043. 'node_labeled': True,
  2044. 'edge_labeled': True,
  2045. 'node_attr_dim': 0,
  2046. 'geometry': None,
  2047. 'edge_attr_dim': 0,
  2048. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DBLP_v1.zip',
  2049. 'domain': 'social networks',
  2050. },
  2051. 'deezer_ego_nets': {
  2052. 'database': 'tudataset',
  2053. 'reference': '[30]',
  2054. 'dataset_size': 9629,
  2055. 'class_number': 2,
  2056. 'task_type': 'classification',
  2057. 'ave_node_num': 23.49,
  2058. 'ave_edge_num': 65.25,
  2059. 'node_labeled': False,
  2060. 'edge_labeled': False,
  2061. 'node_attr_dim': 0,
  2062. 'geometry': None,
  2063. 'edge_attr_dim': 0,
  2064. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/deezer_ego_nets.zip',
  2065. 'domain': 'social networks',
  2066. },
  2067. 'facebook_ct1': {
  2068. 'database': 'tudataset',
  2069. 'reference': '[32]',
  2070. 'dataset_size': 995,
  2071. 'class_number': 2,
  2072. 'task_type': 'classification',
  2073. 'ave_node_num': 95.72,
  2074. 'ave_edge_num': 269.01,
  2075. 'node_labeled': False,
  2076. 'edge_labeled': False,
  2077. 'node_attr_dim': 0,
  2078. 'geometry': None,
  2079. 'edge_attr_dim': 'temporal',
  2080. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct1.zip',
  2081. 'domain': 'social networks',
  2082. },
  2083. 'facebook_ct2': {
  2084. 'database': 'tudataset',
  2085. 'reference': '[32]',
  2086. 'dataset_size': 995,
  2087. 'class_number': 2,
  2088. 'task_type': 'classification',
  2089. 'ave_node_num': 95.72,
  2090. 'ave_edge_num': 269.01,
  2091. 'node_labeled': False,
  2092. 'edge_labeled': False,
  2093. 'node_attr_dim': 0,
  2094. 'geometry': None,
  2095. 'edge_attr_dim': 'temporal',
  2096. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct2.zip',
  2097. 'domain': 'social networks',
  2098. },
  2099. 'github_stargazers': {
  2100. 'database': 'tudataset',
  2101. 'reference': '[30]',
  2102. 'dataset_size': 12725,
  2103. 'class_number': 2,
  2104. 'task_type': 'classification',
  2105. 'ave_node_num': 113.79,
  2106. 'ave_edge_num': 234.64,
  2107. 'node_labeled': False,
  2108. 'edge_labeled': False,
  2109. 'node_attr_dim': 0,
  2110. 'geometry': None,
  2111. 'edge_attr_dim': 0,
  2112. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/github_stargazers.zip',
  2113. 'domain': 'social networks',
  2114. },
  2115. 'highschool_ct1': {
  2116. 'database': 'tudataset',
  2117. 'reference': '[32]',
  2118. 'dataset_size': 180,
  2119. 'class_number': 2,
  2120. 'task_type': 'classification',
  2121. 'ave_node_num': 52.32,
  2122. 'ave_edge_num': 544.81,
  2123. 'node_labeled': False,
  2124. 'edge_labeled': False,
  2125. 'node_attr_dim': 0,
  2126. 'geometry': None,
  2127. 'edge_attr_dim': 'temporal',
  2128. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct1.zip',
  2129. 'domain': 'social networks',
  2130. },
  2131. 'highschool_ct2': {
  2132. 'database': 'tudataset',
  2133. 'reference': '[32]',
  2134. 'dataset_size': 180,
  2135. 'class_number': 2,
  2136. 'task_type': 'classification',
  2137. 'ave_node_num': 52.32,
  2138. 'ave_edge_num': 544.81,
  2139. 'node_labeled': False,
  2140. 'edge_labeled': False,
  2141. 'node_attr_dim': 0,
  2142. 'geometry': None,
  2143. 'edge_attr_dim': 'temporal',
  2144. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct2.zip',
  2145. 'domain': 'social networks',
  2146. },
  2147. 'IMDB-BINARY': {
  2148. 'database': 'tudataset',
  2149. 'reference': '[14]',
  2150. 'dataset_size': 1000,
  2151. 'class_number': 2,
  2152. 'task_type': 'classification',
  2153. 'ave_node_num': 19.77,
  2154. 'ave_edge_num': 96.53,
  2155. 'node_labeled': False,
  2156. 'edge_labeled': False,
  2157. 'node_attr_dim': 0,
  2158. 'geometry': '',
  2159. 'edge_attr_dim': 0,
  2160. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-BINARY.zip',
  2161. 'domain': 'social networks',
  2162. },
  2163. 'IMDB-MULTI': {
  2164. 'database': 'tudataset',
  2165. 'reference': '[14]',
  2166. 'dataset_size': 1500,
  2167. 'class_number': 3,
  2168. 'task_type': 'classification',
  2169. 'ave_node_num': 13.0,
  2170. 'ave_edge_num': 65.94,
  2171. 'node_labeled': False,
  2172. 'edge_labeled': False,
  2173. 'node_attr_dim': 0,
  2174. 'geometry': '',
  2175. 'edge_attr_dim': 0,
  2176. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-MULTI.zip',
  2177. 'domain': 'social networks',
  2178. },
  2179. 'infectious_ct1': {
  2180. 'database': 'tudataset',
  2181. 'reference': '[32]',
  2182. 'dataset_size': 200,
  2183. 'class_number': 2,
  2184. 'task_type': 'classification',
  2185. 'ave_node_num': 50.0,
  2186. 'ave_edge_num': 459.72,
  2187. 'node_labeled': False,
  2188. 'edge_labeled': False,
  2189. 'node_attr_dim': 0,
  2190. 'geometry': None,
  2191. 'edge_attr_dim': 'temporal',
  2192. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct1.zip',
  2193. 'domain': 'social networks',
  2194. },
  2195. 'infectious_ct2': {
  2196. 'database': 'tudataset',
  2197. 'reference': '[32]',
  2198. 'dataset_size': 200,
  2199. 'class_number': 2,
  2200. 'task_type': 'classification',
  2201. 'ave_node_num': 50.0,
  2202. 'ave_edge_num': 459.72,
  2203. 'node_labeled': False,
  2204. 'edge_labeled': False,
  2205. 'node_attr_dim': 0,
  2206. 'geometry': None,
  2207. 'edge_attr_dim': 'temporal',
  2208. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct2.zip',
  2209. 'domain': 'social networks',
  2210. },
  2211. 'mit_ct1': {
  2212. 'database': 'tudataset',
  2213. 'reference': '[32]',
  2214. 'dataset_size': 97,
  2215. 'class_number': 2,
  2216. 'task_type': 'classification',
  2217. 'ave_node_num': 20.0,
  2218. 'ave_edge_num': 1469.15,
  2219. 'node_labeled': False,
  2220. 'edge_labeled': False,
  2221. 'node_attr_dim': 0,
  2222. 'geometry': None,
  2223. 'edge_attr_dim': 'temporal',
  2224. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct1.zip',
  2225. 'domain': 'social networks',
  2226. },
  2227. 'mit_ct2': {
  2228. 'database': 'tudataset',
  2229. 'reference': '[32]',
  2230. 'dataset_size': 97,
  2231. 'class_number': 2,
  2232. 'task_type': 'classification',
  2233. 'ave_node_num': 20.0,
  2234. 'ave_edge_num': 1469.15,
  2235. 'node_labeled': False,
  2236. 'edge_labeled': False,
  2237. 'node_attr_dim': 0,
  2238. 'geometry': None,
  2239. 'edge_attr_dim': 'temporal',
  2240. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct2.zip',
  2241. 'domain': 'social networks',
  2242. },
  2243. 'REDDIT-BINARY': {
  2244. 'database': 'tudataset',
  2245. 'reference': '[14]',
  2246. 'dataset_size': 2000,
  2247. 'class_number': 2,
  2248. 'task_type': 'classification',
  2249. 'ave_node_num': 429.63,
  2250. 'ave_edge_num': 497.75,
  2251. 'node_labeled': False,
  2252. 'edge_labeled': False,
  2253. 'node_attr_dim': 0,
  2254. 'geometry': None,
  2255. 'edge_attr_dim': 0,
  2256. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-BINARY.zip',
  2257. 'domain': 'social networks',
  2258. },
  2259. 'REDDIT-MULTI-5K': {
  2260. 'database': 'tudataset',
  2261. 'reference': '[14]',
  2262. 'dataset_size': 4999,
  2263. 'class_number': 5,
  2264. 'task_type': 'classification',
  2265. 'ave_node_num': 508.52,
  2266. 'ave_edge_num': 594.87,
  2267. 'node_labeled': False,
  2268. 'edge_labeled': False,
  2269. 'node_attr_dim': 0,
  2270. 'geometry': None,
  2271. 'edge_attr_dim': 0,
  2272. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-5K.zip',
  2273. 'domain': 'social networks',
  2274. },
  2275. 'REDDIT-MULTI-12K': {
  2276. 'database': 'tudataset',
  2277. 'reference': '[14]',
  2278. 'dataset_size': 11929,
  2279. 'class_number': 11,
  2280. 'task_type': 'classification',
  2281. 'ave_node_num': 391.41,
  2282. 'ave_edge_num': 456.89,
  2283. 'node_labeled': False,
  2284. 'edge_labeled': False,
  2285. 'node_attr_dim': 0,
  2286. 'geometry': None,
  2287. 'edge_attr_dim': 0,
  2288. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-12K.zip',
  2289. 'domain': 'social networks',
  2290. },
  2291. 'reddit_threads': {
  2292. 'database': 'tudataset',
  2293. 'reference': '[30]',
  2294. 'dataset_size': 203088,
  2295. 'class_number': 2,
  2296. 'task_type': 'classification',
  2297. 'ave_node_num': 23.93,
  2298. 'ave_edge_num': 24.99,
  2299. 'node_labeled': False,
  2300. 'edge_labeled': False,
  2301. 'node_attr_dim': 0,
  2302. 'geometry': None,
  2303. 'edge_attr_dim': 0,
  2304. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/reddit_threads.zip',
  2305. 'domain': 'social networks',
  2306. },
  2307. 'tumblr_ct1': {
  2308. 'database': 'tudataset',
  2309. 'reference': '[32]',
  2310. 'dataset_size': 373,
  2311. 'class_number': 2,
  2312. 'task_type': 'classification',
  2313. 'ave_node_num': 53.11,
  2314. 'ave_edge_num': 199.78,
  2315. 'node_labeled': False,
  2316. 'edge_labeled': False,
  2317. 'node_attr_dim': 0,
  2318. 'geometry': None,
  2319. 'edge_attr_dim': 'temporal',
  2320. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct1.zip',
  2321. 'domain': 'social networks',
  2322. },
  2323. 'tumblr_ct2': {
  2324. 'database': 'tudataset',
  2325. 'reference': '[32]',
  2326. 'dataset_size': 373,
  2327. 'class_number': 2,
  2328. 'task_type': 'classification',
  2329. 'ave_node_num': 53.11,
  2330. 'ave_edge_num': 199.78,
  2331. 'node_labeled': False,
  2332. 'edge_labeled': False,
  2333. 'node_attr_dim': 0,
  2334. 'geometry': None,
  2335. 'edge_attr_dim': 'temporal',
  2336. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct2.zip',
  2337. 'domain': 'social networks',
  2338. },
  2339. 'twitch_egos': {
  2340. 'database': 'tudataset',
  2341. 'reference': '[30]',
  2342. 'dataset_size': 127094,
  2343. 'class_number': 2,
  2344. 'task_type': 'classification',
  2345. 'ave_node_num': 29.67,
  2346. 'ave_edge_num': 86.59,
  2347. 'node_labeled': False,
  2348. 'edge_labeled': False,
  2349. 'node_attr_dim': 0,
  2350. 'geometry': None,
  2351. 'edge_attr_dim': 0,
  2352. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/twitch_egos.zip',
  2353. 'domain': 'social networks',
  2354. },
  2355. 'TWITTER-Real-Graph-Partial': {
  2356. 'database': 'tudataset',
  2357. 'reference': '[26]',
  2358. 'dataset_size': 144033,
  2359. 'class_number': 2,
  2360. 'task_type': 'classification',
  2361. 'ave_node_num': 4.03,
  2362. 'ave_edge_num': 4.98,
  2363. 'node_labeled': True,
  2364. 'edge_labeled': False,
  2365. 'node_attr_dim': 0,
  2366. 'geometry': None,
  2367. 'edge_attr_dim': 1,
  2368. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TWITTER-Real-Graph-Partial.zip',
  2369. 'domain': 'social networks',
  2370. },
  2371. ### synthetic
  2372. 'COLORS-3': {
  2373. 'database': 'tudataset',
  2374. 'reference': '[27]',
  2375. 'dataset_size': 10500,
  2376. 'class_number': 11,
  2377. 'task_type': 'classification',
  2378. 'ave_node_num': 61.31,
  2379. 'ave_edge_num': 91.03,
  2380. 'node_labeled': False,
  2381. 'edge_labeled': False,
  2382. 'node_attr_dim': 4,
  2383. 'geometry': None,
  2384. 'edge_attr_dim': 0,
  2385. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLORS-3.zip',
  2386. 'domain': 'synthetic',
  2387. },
  2388. 'SYNTHETIC': {
  2389. 'database': 'tudataset',
  2390. 'reference': '[3]',
  2391. 'dataset_size': 300,
  2392. 'class_number': 2,
  2393. 'task_type': 'classification',
  2394. 'ave_node_num': 100.0,
  2395. 'ave_edge_num': 196.0,
  2396. 'node_labeled': False,
  2397. 'edge_labeled': False,
  2398. 'node_attr_dim': 1,
  2399. 'geometry': None,
  2400. 'edge_attr_dim': 0,
  2401. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETIC.zip',
  2402. 'domain': 'synthetic',
  2403. },
  2404. 'SYNTHETICnew': {
  2405. 'database': 'tudataset',
  2406. 'reference': '[3,10]',
  2407. 'dataset_size': 300,
  2408. 'class_number': 2,
  2409. 'task_type': 'classification',
  2410. 'ave_node_num': 100.0,
  2411. 'ave_edge_num': 196.25,
  2412. 'node_labeled': False,
  2413. 'edge_labeled': False,
  2414. 'node_attr_dim': 1,
  2415. 'geometry': None,
  2416. 'edge_attr_dim': 0,
  2417. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETICnew.zip',
  2418. 'domain': 'synthetic',
  2419. },
  2420. 'Synthie': {
  2421. 'database': 'tudataset',
  2422. 'reference': '[21]',
  2423. 'dataset_size': 400,
  2424. 'class_number': 4,
  2425. 'task_type': 'classification',
  2426. 'ave_node_num': 95.0,
  2427. 'ave_edge_num': 172.93,
  2428. 'node_labeled': False,
  2429. 'edge_labeled': False,
  2430. 'node_attr_dim': 15,
  2431. 'geometry': None,
  2432. 'edge_attr_dim': 0,
  2433. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Synthie.zip',
  2434. 'domain': 'synthetic',
  2435. },
  2436. 'TRIANGLES': {
  2437. 'database': 'tudataset',
  2438. 'reference': '[27]',
  2439. 'dataset_size': 45000,
  2440. 'class_number': 10,
  2441. 'task_type': 'classification',
  2442. 'ave_node_num': 20.85,
  2443. 'ave_edge_num': 32.74,
  2444. 'node_labeled': False,
  2445. 'edge_labeled': False,
  2446. 'node_attr_dim': 0,
  2447. 'geometry': None,
  2448. 'edge_attr_dim': 0,
  2449. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TRIANGLES.zip',
  2450. 'domain': 'synthetic',
  2451. },
  2452. }
  # Single lookup table covering every known dataset. The per-database tables
  # are folded in order, so on a duplicate dataset name the entry from the
  # table applied last replaces the earlier one.
  DATASET_META = dict(GREYC_META)
  DATASET_META.update(IAM_META)
  DATASET_META.update(TUDataset_META)
  def list_of_databases():
      """Return the names of all databases.

      Returns
      -------
      list
          A new list holding each item produced by iterating ``DATABASES``,
          in iteration order.
      """
      return list(DATABASES)
  def list_of_datasets():
      """Return the names of all datasets.

      Returns
      -------
      list
          A new list holding the keys of ``DATASET_META``, in the order they
          appear in that dictionary.
      """
      return list(DATASET_META)

A Python package for graph kernels, graph edit distances, and the graph pre-image problem.