|
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489 |
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Metadata of graph datasets, grouped by the database they come from.

Created on Tue Oct 20 14:25:49 2020

@author: ljia
"""
-
# Maps each database identifier (the value stored under the 'database' key of
# the per-dataset metadata entries in this file) to a URL for that database.
DATABASES = {
    'greyc': 'https://brunl01.users.greyc.fr/CHEMISTRY/',
    'iam': 'https://iapr-tc15.greyc.fr/IAM/',
    # NOTE(review): this is the only plain-http URL in the table -- confirm
    # whether an https endpoint should be used instead.
    'tudataset': 'http://graphlearning.io/docs/datasets/',
}
-
-
### -------- database greyc -------- ###
# Maps a dataset name to a dict of metadata for that dataset. Every entry
# carries the same core keys:
#   'database'         -- identifier of the database (a key of DATABASES).
#   'reference'        -- literature reference, None for every entry here.
#   'dataset_size', 'class_number', 'task_type',
#   'ave_node_num', 'ave_edge_num',
#   'node_labeled', 'edge_labeled',
#   'node_attr_dim', 'geometry', 'edge_attr_dim'
#                      -- descriptive statistics/flags; None presumably means
#                         "unknown / not filled in yet" (TODO confirm).
#   'url'              -- download location of the dataset archive.
#   'domain'           -- application domain of the dataset.
#   'train_valid_test' -- files of the train / valid / test splits, in that
#                         order (see 'AIDS_greyc' and 'PAH').
#                         NOTE(review): entries without splits use either []
#                         or None -- confirm whether the two are meant to
#                         differ.
#   'stereoisomerism'  -- boolean flag.
#   'load_files'       -- file names (or a nested list of file names) inside
#                         the archive used for loading.
# Optional keys: 'extra_params' (e.g. {'gformat': 'cml'}) and 'extra_info'
# (free-text usage hint).
GREYC_META = {
    'ACE': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 32,
        'class_number': 2,
        'task_type': 'classification',
        'ave_node_num': 52,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ACEDataset.tar',
        'domain': 'small molecules',
        'train_valid_test': [],
        'stereoisomerism': True,
        'load_files': ['data.ds'],
        'extra_params': {'gformat': 'cml'},
    },
    'Acyclic': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 183,
        'class_number': None,
        'task_type': 'regression',
        'ave_node_num': 8.15,
        'ave_edge_num': 7.15,
        'node_labeled': True,
        'edge_labeled': False,
        'node_attr_dim': 0,
        'geometry': None,
        'edge_attr_dim': 0,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/Acyclic.tar.gz',
        'domain': 'small molecules',
        'train_valid_test': None,
        'stereoisomerism': False,
        'load_files': ['dataset_bps.ds'],
    },
    'AIDS_greyc': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 2000,
        'class_number': 2,
        'task_type': 'classification',
        'ave_node_num': 15.69,
        'ave_edge_num': 16.20,
        'node_labeled': True,
        'edge_labeled': True,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        # NOTE(review): the URL points at the IAM host although 'database'
        # is 'greyc' -- confirm this is intended.
        'url': 'https://iapr-tc15.greyc.fr/IAM/AIDS.zip',
        'domain': 'small molecules',
        'train_valid_test': [
            'data/train.cxl',
            'data/valid.cxl',
            'data/test.cxl',
        ],
        'stereoisomerism': False,
        'load_files': ['data/'],
    },
    'Alkane': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 150,
        'class_number': None,
        'task_type': 'regression',
        'ave_node_num': 8.87,
        'ave_edge_num': 7.87,
        'node_labeled': False,
        'edge_labeled': False,
        'node_attr_dim': 0,
        'geometry': None,
        'edge_attr_dim': 0,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/alkane_dataset.tar.gz',
        'domain': 'small molecules',
        'train_valid_test': None,
        'stereoisomerism': False,
        'load_files': ['dataset.ds', 'dataset_boiling_point_names.txt'],
    },
    'Chiral': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 35,
        'class_number': None,
        'task_type': 'regression',
        'ave_node_num': 21.29,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetAcyclicChiral.tar',
        'domain': 'small molecules',
        'train_valid_test': [],
        'stereoisomerism': True,
        'load_files': ['data.txt'],
        'extra_params': {'gformat': 'cml'},
    },
    'MAO': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 68,
        'class_number': 2,
        'task_type': 'classification',
        'ave_node_num': 18.38,
        'ave_edge_num': 19.63,
        'node_labeled': True,
        'edge_labeled': True,
        'node_attr_dim': 0,
        'geometry': None,
        'edge_attr_dim': 0,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/mao.tgz',
        'domain': 'small molecules',
        'train_valid_test': None,
        'stereoisomerism': False,
        'load_files': ['dataset.ds'],
    },
    'Monoterpenoides': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 382,
        'class_number': 10,
        'task_type': 'classification',
        'ave_node_num': 10,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/monoterpenoides.tar.gz',
        'domain': 'small molecules',
        'train_valid_test': None,
        'stereoisomerism': False,
        'load_files': ['dataset_10+.ds'],
    },
    'PAH': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 94,
        'class_number': 2,
        'task_type': 'classification',
        'ave_node_num': 20.7,
        'ave_edge_num': 24.43,
        'node_labeled': False,
        'edge_labeled': False,
        'node_attr_dim': 0,
        'geometry': None,
        'edge_attr_dim': 0,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/PAH.tar.gz',
        'domain': 'small molecules',
        # No validation split: the middle slot is None.
        'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
        'stereoisomerism': False,
        'load_files': [['trainset_0.ds', 'testset_0.ds']],
    },
    'PTC': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 416,
        'class_number': None,
        'task_type': 'classification',
        'ave_node_num': 14.4,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ptc.tgz',
        'domain': 'small molecules',
        'train_valid_test': None,
        'stereoisomerism': False,
        'load_files': [],
        # Free-text usage hint; the pieces below concatenate to exactly the
        # original single-line string (including the spaces before '\n').
        'extra_info': (
            'This dataset has test and train datasets. '
            'Select gender between mm, fm, mr, fr. \n'
            "dataloader = DataLoader('Ptc',root = ..., option = 'mm') \n"
            'test,train = dataloader.dataset \n'
            'Gs_test, y_test = test \n'
            'Gs_train_, y_train = train'
        ),
    },
    'Steroid': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 64,
        'class_number': None,
        'task_type': 'regression',
        'ave_node_num': 75.11,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/SteroidDataset.tar',
        'domain': 'small molecules',
        'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
        'stereoisomerism': False,
        'load_files': ['dataWithOutsider.ds'],
        'extra_params': {'gformat': 'cml'},
    },
    'Vitamin_D': {
        'database': 'greyc',
        'reference': None,
        'dataset_size': 69,
        'class_number': None,
        'task_type': 'regression',
        'ave_node_num': 76.91,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetVitamin.tar',
        'domain': 'small molecules',
        'train_valid_test': [],
        'stereoisomerism': True,
        'load_files': ['data.txt'],
        'extra_params': {'gformat': 'cml'},
    },
}
-
-
### -------- database iam -------- ###
# @todo: several datasets in this database are included in TUDataset. However, they do not include train/valid/test sets.
# Maps a dataset name to a dict of metadata for that dataset. The statistics
# of both entries are still None (presumably not filled in yet -- TODO
# confirm). Unlike the greyc entries, these entries have no
# 'stereoisomerism' key.
IAM_META = {
    'GREC': {
        'database': 'iam',
        'reference': None,
        'dataset_size': None,
        'class_number': None,
        'task_type': None,
        'ave_node_num': None,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://iapr-tc15.greyc.fr/IAM/GREC.zip',
        'domain': None,
        # Listed as train, valid, test so the positions match the key name
        # and the order used by the other split-aware entries in this file.
        'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl'],
        # Kept in its original order so the combined load order is unchanged.
        'load_files': [['data/test.cxl', 'data/train.cxl', 'data/valid.cxl']],
    },
    'Web': {
        'database': 'iam',
        'reference': None,
        'dataset_size': None,
        'class_number': None,
        'task_type': None,
        'ave_node_num': None,
        'ave_edge_num': None,
        'node_labeled': None,
        'edge_labeled': None,
        'node_attr_dim': None,
        'geometry': None,
        'edge_attr_dim': None,
        'url': 'https://iapr-tc15.greyc.fr/IAM/Web.zip',
        'domain': None,
        # Listed as train, valid, test so the positions match the key name
        # and the order used by the other split-aware entries in this file.
        'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl'],
        # Kept in its original order so the combined load order is unchanged.
        'load_files': [['data/test.cxl', 'data/train.cxl', 'data/valid.cxl']],
    },
}
-
-
- ### -------- database tudataset -------- ###
- TUDataset_META = {
- ### small molecules
- 'AIDS': {
- 'database': 'tudataset',
- 'reference': '[16,17]',
- 'dataset_size': 2000,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 15.69,
- 'ave_edge_num': 16.2,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 4,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/AIDS.zip',
- 'domain': 'small molecules',
- },
- 'alchemy_full': {
- 'database': 'tudataset',
- 'reference': '[29]',
- 'dataset_size': 202579,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 10.1,
- 'ave_edge_num': 10.44,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 3,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/alchemy_full.zip',
- 'domain': 'small molecules',
- },
- 'aspirin': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 111763,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 21.0,
- 'ave_edge_num': 151.52,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/aspirin.zip',
- 'domain': 'small molecules',
- },
- 'benzene': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 527984,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 12.0,
- 'ave_edge_num': 64.94,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/benzene.zip',
- 'domain': 'small molecules',
- },
- 'BZR': {
- 'database': 'tudataset',
- 'reference': '[7]',
- 'dataset_size': 405,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 35.75,
- 'ave_edge_num': 38.36,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 3,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR.zip',
- 'domain': 'small molecules',
- },
- 'BZR_MD': {
- 'database': 'tudataset',
- 'reference': '[7,23]',
- 'dataset_size': 306,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.3,
- 'ave_edge_num': 225.06,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR_MD.zip',
- 'domain': 'small molecules',
- },
- 'COX2': {
- 'database': 'tudataset',
- 'reference': '[7]',
- 'dataset_size': 467,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 41.22,
- 'ave_edge_num': 43.45,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 3,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2.zip',
- 'domain': 'small molecules',
- },
- 'COX2_MD': {
- 'database': 'tudataset',
- 'reference': '[7,23]',
- 'dataset_size': 303,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.28,
- 'ave_edge_num': 335.12,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2_MD.zip',
- 'domain': 'small molecules',
- },
- 'DHFR': {
- 'database': 'tudataset',
- 'reference': '[7]',
- 'dataset_size': 467,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 42.43,
- 'ave_edge_num': 44.54,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 3,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR.zip',
- 'domain': 'small molecules',
- },
- 'DHFR_MD': {
- 'database': 'tudataset',
- 'reference': '[7,23]',
- 'dataset_size': 393,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 23.87,
- 'ave_edge_num': 283.01,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR_MD.zip',
- 'domain': 'small molecules',
- },
- 'ER_MD': {
- 'database': 'tudataset',
- 'reference': '[7,23]',
- 'dataset_size': 446,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.33,
- 'ave_edge_num': 234.85,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ER_MD.zip',
- 'domain': 'small molecules',
- },
- 'ethanol': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 455093,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 9.0,
- 'ave_edge_num': 36.0,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ethanol.zip',
- 'domain': 'small molecules',
- },
- 'FRANKENSTEIN': {
- 'database': 'tudataset',
- 'reference': '[15]',
- 'dataset_size': 4337,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 16.9,
- 'ave_edge_num': 17.88,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 780,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FRANKENSTEIN.zip',
- 'domain': 'small molecules',
- },
- 'malonaldehyde': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 893238,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 9.0,
- 'ave_edge_num': 36.0,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/malonaldehyde.zip',
- 'domain': 'small molecules',
- },
- 'MCF-7': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 27770,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.39,
- 'ave_edge_num': 28.52,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7.zip',
- 'domain': 'small molecules',
- },
- 'MCF-7H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 27770,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 47.3,
- 'ave_edge_num': 49.43,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7H.zip',
- 'domain': 'small molecules',
- },
- 'MOLT-4': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 39765,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.09,
- 'ave_edge_num': 28.13,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4.zip',
- 'domain': 'small molecules',
- },
- 'MOLT-4H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 39765,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.7,
- 'ave_edge_num': 48.73,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4H.zip',
- 'domain': 'small molecules',
- },
- 'Mutagenicity': {
- 'database': 'tudataset',
- 'reference': '[16,20]',
- 'dataset_size': 4337,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 30.32,
- 'ave_edge_num': 30.77,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Mutagenicity.zip',
- 'domain': 'small molecules',
- },
- 'MUTAG': {
- 'database': 'tudataset',
- 'reference': '[1,23]',
- 'dataset_size': 188,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.93,
- 'ave_edge_num': 19.79,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip',
- 'domain': 'small molecules',
- },
- 'naphthalene': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 226256,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 18.0,
- 'ave_edge_num': 127.37,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/naphthalene.zip',
- 'domain': 'small molecules',
- },
- 'NCI1': {
- 'database': 'tudataset',
- 'reference': '[8,9,22]',
- 'dataset_size': 4110,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 29.87,
- 'ave_edge_num': 32.3,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI1.zip',
- 'domain': 'small molecules',
- },
- 'NCI109': {
- 'database': 'tudataset',
- 'reference': '[8,9,22]',
- 'dataset_size': 4127,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 29.68,
- 'ave_edge_num': 32.13,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI109.zip',
- 'domain': 'small molecules',
- },
- 'NCI-H23': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40353,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.07,
- 'ave_edge_num': 28.1,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23.zip',
- 'domain': 'small molecules',
- },
- 'NCI-H23H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40353,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.67,
- 'ave_edge_num': 48.69,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23H.zip',
- 'domain': 'small molecules',
- },
- 'OVCAR-8': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40516,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.07,
- 'ave_edge_num': 28.1,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8.zip',
- 'domain': 'small molecules',
- },
- 'OVCAR-8H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40516,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.67,
- 'ave_edge_num': 48.7,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8H.zip',
- 'domain': 'small molecules',
- },
- 'P388': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 41472,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.11,
- 'ave_edge_num': 23.55,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388.zip',
- 'domain': 'small molecules',
- },
- 'P388H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 41472,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 40.44,
- 'ave_edge_num': 41.88,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388H.zip',
- 'domain': 'small molecules',
- },
- 'PC-3': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 27509,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.35,
- 'ave_edge_num': 28.49,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3.zip',
- 'domain': 'small molecules',
- },
- 'PC-3H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 27509,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 47.19,
- 'ave_edge_num': 49.32,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3H.zip',
- 'domain': 'small molecules',
- },
- 'PTC_FM': {
- 'database': 'tudataset',
- 'reference': '[2,23]',
- 'dataset_size': 349,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 14.11,
- 'ave_edge_num': 14.48,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FM.zip',
- 'domain': 'small molecules',
- },
- 'PTC_FR': {
- 'database': 'tudataset',
- 'reference': '[2,23]',
- 'dataset_size': 351,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 14.56,
- 'ave_edge_num': 15.0,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FR.zip',
- 'domain': 'small molecules',
- },
- 'PTC_MM': {
- 'database': 'tudataset',
- 'reference': '[2,23]',
- 'dataset_size': 336,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 13.97,
- 'ave_edge_num': 14.32,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MM.zip',
- 'domain': 'small molecules',
- },
- 'PTC_MR': {
- 'database': 'tudataset',
- 'reference': '[2,23]',
- 'dataset_size': 344,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 14.29,
- 'ave_edge_num': 14.69,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MR.zip',
- 'domain': 'small molecules',
- },
- 'QM9': {
- 'database': 'tudataset',
- 'reference': '[33,34,35]',
- 'dataset_size': 129433,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 18.03,
- 'ave_edge_num': 18.63,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 16,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 4,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/QM9.zip',
- 'domain': 'small molecules',
- },
- 'salicylic_acid': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 220232,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 16.0,
- 'ave_edge_num': 104.13,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/salicylic_acid.zip',
- 'domain': 'small molecules',
- },
- 'SF-295': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40271,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.06,
- 'ave_edge_num': 28.08,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295.zip',
- 'domain': 'small molecules',
- },
- 'SF-295H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40271,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.65,
- 'ave_edge_num': 48.68,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295H.zip',
- 'domain': 'small molecules',
- },
- 'SN12C': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40004,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.08,
- 'ave_edge_num': 28.11,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12C.zip',
- 'domain': 'small molecules',
- },
- 'SN12CH': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40004,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.69,
- 'ave_edge_num': 48.71,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12CH.zip',
- 'domain': 'small molecules',
- },
- 'SW-620': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40532,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.05,
- 'ave_edge_num': 28.08,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620.zip',
- 'domain': 'small molecules',
- },
- 'SW-620H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 40532,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.62,
- 'ave_edge_num': 48.65,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620H.zip',
- 'domain': 'small molecules',
- },
- 'toluene': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 342791,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 15.0,
- 'ave_edge_num': 96.15,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/toluene.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AhR_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8169,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 18.09,
- 'ave_edge_num': 18.5,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AhR_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 272,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.13,
- 'ave_edge_num': 23.05,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AhR_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 607,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.64,
- 'ave_edge_num': 18.06,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 9362,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 18.39,
- 'ave_edge_num': 18.84,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 292,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.35,
- 'ave_edge_num': 23.32,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 585,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.99,
- 'ave_edge_num': 18.45,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR-LBD_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8599,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.77,
- 'ave_edge_num': 18.16,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR-LBD_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 253,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.85,
- 'ave_edge_num': 22.73,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_AR-LBD_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 580,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.09,
- 'ave_edge_num': 17.42,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ARE_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 7167,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 16.28,
- 'ave_edge_num': 16.52,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ARE_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 234,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.99,
- 'ave_edge_num': 22.91,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ARE_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 552,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.01,
- 'ave_edge_num': 17.33,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_aromatase_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 7226,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.5,
- 'ave_edge_num': 17.79,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_aromatase_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 214,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.65,
- 'ave_edge_num': 22.36,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_aromatase_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 528,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 16.74,
- 'ave_edge_num': 16.99,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ATAD5_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 9091,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.89,
- 'ave_edge_num': 18.3,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ATAD5_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 272,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.99,
- 'ave_edge_num': 22.89,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ATAD5_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 619,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.68,
- 'ave_edge_num': 18.11,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 7697,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.58,
- 'ave_edge_num': 17.94,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 265,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.16,
- 'ave_edge_num': 23.13,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 515,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.66,
- 'ave_edge_num': 18.1,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER-LBD_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8753,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 18.06,
- 'ave_edge_num': 18.47,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER-LBD_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 287,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.28,
- 'ave_edge_num': 23.23,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_ER-LBD_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 599,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.75,
- 'ave_edge_num': 18.17,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_HSE_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8150,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 16.72,
- 'ave_edge_num': 17.04,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_HSE_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 267,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.07,
- 'ave_edge_num': 23.0,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_HSE_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 607,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.61,
- 'ave_edge_num': 18.01,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_MMP_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 7320,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.49,
- 'ave_edge_num': 17.83,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_MMP_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 238,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.68,
- 'ave_edge_num': 22.55,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_MMP_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 541,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 16.67,
- 'ave_edge_num': 16.88,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_p53_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8634,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.79,
- 'ave_edge_num': 18.19,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_p53_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 269,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.14,
- 'ave_edge_num': 23.04,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_p53_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 613,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.34,
- 'ave_edge_num': 17.72,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_PPAR-gamma_training': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 8184,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.23,
- 'ave_edge_num': 17.55,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_training.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_PPAR-gamma_testing': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 267,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 22.04,
- 'ave_edge_num': 22.93,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_testing.zip',
- 'domain': 'small molecules',
- },
- 'Tox21_PPAR-gamma_evaluation': {
- 'database': 'tudataset',
- 'reference': '[24]',
- 'dataset_size': 602,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 17.38,
- 'ave_edge_num': 17.77,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_evaluation.zip',
- 'domain': 'small molecules',
- },
- 'UACC257': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 39988,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.09,
- 'ave_edge_num': 28.12,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257.zip',
- 'domain': 'small molecules',
- },
- 'UACC257H': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 39988,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 46.68,
- 'ave_edge_num': 48.71,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257H.zip',
- 'domain': 'small molecules',
- },
- 'uracil': {
- 'database': 'tudataset',
- 'reference': '[36]',
- 'dataset_size': 133770,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 12.0,
- 'ave_edge_num': 64.44,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 6,
- 'geometry': '3D, RI',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/uracil.zip',
- 'domain': 'small molecules',
- },
- 'Yeast': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 79601,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 21.54,
- 'ave_edge_num': 22.84,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Yeast.zip',
- 'domain': 'small molecules',
- },
- 'YeastH': {
- 'database': 'tudataset',
- 'reference': '[28]',
- 'dataset_size': 79601,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 39.44,
- 'ave_edge_num': 40.74,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/YeastH.zip',
- 'domain': 'small molecules',
- },
- 'ZINC_full': {
- 'database': 'tudataset',
- 'reference': '[31]',
- 'dataset_size': 249456,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 23.14,
- 'ave_edge_num': 24.91,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_full.zip',
- 'domain': 'small molecules',
- },
- 'ZINC_test': {
- 'database': 'tudataset',
- 'reference': '[31]',
- 'dataset_size': 5000,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 23.1,
- 'ave_edge_num': 24.83,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_test.zip',
- 'domain': 'small molecules',
- },
- 'ZINC_train': {
- 'database': 'tudataset',
- 'reference': '[31]',
- 'dataset_size': 220011,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 23.15,
- 'ave_edge_num': 24.91,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_train.zip',
- 'domain': 'small molecules',
- },
- 'ZINC_val': {
- 'database': 'tudataset',
- 'reference': '[31]',
- 'dataset_size': 24445,
- 'class_number': None,
- 'task_type': 'regression',
- 'ave_node_num': 23.13,
- 'ave_edge_num': 24.88,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_val.zip',
- 'domain': 'small molecules',
- },
-
- ### bioinformatics
- 'DD': {
- 'database': 'tudataset',
- 'reference': '[6,22]',
- 'dataset_size': 1178,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 284.32,
- 'ave_edge_num': 715.66,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DD.zip',
- 'domain': 'bioinformatics',
- },
- 'ENZYMES': {
- 'database': 'tudataset',
- 'reference': '[4,5]',
- 'dataset_size': 600,
- 'class_number': 6,
- 'task_type': 'classification',
- 'ave_node_num': 32.63,
- 'ave_edge_num': 62.14,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 18,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'http://www.chrsmrrs.com/graphkerneldatasets/ENZYMES.zip',
- 'domain': 'bioinformatics',
- },
- 'KKI': {
- 'database': 'tudataset',
- 'reference': '[26]',
- 'dataset_size': 83,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 26.96,
- 'ave_edge_num': 48.42,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/KKI.zip',
- 'domain': 'bioinformatics',
- },
- 'OHSU': {
- 'database': 'tudataset',
- 'reference': '[26]',
- 'dataset_size': 79,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 82.01,
- 'ave_edge_num': 199.66,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OHSU.zip',
- 'domain': 'bioinformatics',
- },
- 'Peking_1': {
- 'database': 'tudataset',
- 'reference': '[26]',
- 'dataset_size': 85,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 39.31,
- 'ave_edge_num': 77.35,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Peking_1.zip',
- 'domain': 'bioinformatics',
- },
- 'PROTEINS': {
- 'database': 'tudataset',
- 'reference': '[4,6]',
- 'dataset_size': 1113,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 39.06,
- 'ave_edge_num': 72.82,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 1,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS.zip',
- 'domain': 'bioinformatics',
- },
- 'PROTEINS_full': {
- 'database': 'tudataset',
- 'reference': '[4,6]',
- 'dataset_size': 1113,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 39.06,
- 'ave_edge_num': 72.82,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 29,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS_full.zip',
- 'domain': 'bioinformatics',
- },
-
- ### computer vision
- 'COIL-DEL': {
- 'database': 'tudataset',
- 'reference': '[16,18]',
- 'dataset_size': 3900,
- 'class_number': 100,
- 'task_type': 'classification',
- 'ave_node_num': 21.54,
- 'ave_edge_num': 54.24,
- 'node_labeled': False,
- 'edge_labeled': True,
- 'node_attr_dim': 2,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-DEL.zip',
- 'domain': 'computer vision',
- },
- 'COIL-RAG': {
- 'database': 'tudataset',
- 'reference': '[16,18]',
- 'dataset_size': 3900,
- 'class_number': 100,
- 'task_type': 'classification',
- 'ave_node_num': 3.01,
- 'ave_edge_num': 3.02,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 64,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-RAG.zip',
- 'domain': 'computer vision',
- },
- 'Cuneiform': {
- 'database': 'tudataset',
- 'reference': '[25]',
- 'dataset_size': 267,
- 'class_number': 30,
- 'task_type': 'classification',
- 'ave_node_num': 21.27,
- 'ave_edge_num': 44.8,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 3,
- 'geometry': '3D',
- 'edge_attr_dim': 2,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Cuneiform.zip',
- 'domain': 'computer vision',
- },
- 'Fingerprint': {
- 'database': 'tudataset',
- 'reference': '[16,19]',
- 'dataset_size': 2800,
- 'class_number': 4,
- 'task_type': 'classification',
- 'ave_node_num': 5.42,
- 'ave_edge_num': 4.42,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 2,
- 'geometry': '2D',
- 'edge_attr_dim': 2,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Fingerprint.zip',
- 'domain': 'computer vision',
- },
- 'FIRSTMM_DB': {
- 'database': 'tudataset',
- 'reference': '[11,12,13]',
- 'dataset_size': 41,
- 'class_number': 11,
- 'task_type': 'classification',
- 'ave_node_num': 1377.27,
- 'ave_edge_num': 3074.1,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 1,
- 'geometry': None,
- 'edge_attr_dim': 2,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FIRSTMM_DB.zip',
- 'domain': 'computer vision',
- },
- 'Letter-high': {
- 'database': 'tudataset',
- 'reference': '[16]',
- 'dataset_size': 2250,
- 'class_number': 15,
- 'task_type': 'classification',
- 'ave_node_num': 4.67,
- 'ave_edge_num': 4.5,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 2,
- 'geometry': '2D',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-high.zip',
- 'domain': 'computer vision',
- },
- 'Letter-low': {
- 'database': 'tudataset',
- 'reference': '[16]',
- 'dataset_size': 2250,
- 'class_number': 15,
- 'task_type': 'classification',
- 'ave_node_num': 4.68,
- 'ave_edge_num': 3.13,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 2,
- 'geometry': '2D',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-low.zip',
- 'domain': 'computer vision',
- },
- 'Letter-med': {
- 'database': 'tudataset',
- 'reference': '[16]',
- 'dataset_size': 2250,
- 'class_number': 15,
- 'task_type': 'classification',
- 'ave_node_num': 4.67,
- 'ave_edge_num': 4.5,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 2,
- 'geometry': '2D',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-med.zip',
- 'domain': 'computer vision',
- },
- 'MSRC_9': {
- 'database': 'tudataset',
- 'reference': '[13]',
- 'dataset_size': 221,
- 'class_number': 8,
- 'task_type': 'classification',
- 'ave_node_num': 40.58,
- 'ave_edge_num': 97.94,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_9.zip',
- 'domain': 'computer vision',
- },
- 'MSRC_21': {
- 'database': 'tudataset',
- 'reference': '[13]',
- 'dataset_size': 563,
- 'class_number': 20,
- 'task_type': 'classification',
- 'ave_node_num': 77.52,
- 'ave_edge_num': 198.32,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21.zip',
- 'domain': 'computer vision',
- },
- 'MSRC_21C': {
- 'database': 'tudataset',
- 'reference': '[13]',
- 'dataset_size': 209,
- 'class_number': 20,
- 'task_type': 'classification',
- 'ave_node_num': 40.28,
- 'ave_edge_num': 96.6,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21C.zip',
- 'domain': 'computer vision',
- },
-
- ### social networks
- 'COLLAB': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 5000,
- 'class_number': 3,
- 'task_type': 'classification',
- 'ave_node_num': 74.49,
- 'ave_edge_num': 2457.78,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLLAB.zip',
- 'domain': 'social networks',
- },
- 'dblp_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 755,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 52.87,
- 'ave_edge_num': 320.09,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct1.zip',
- 'domain': 'social networks',
- },
- 'dblp_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 755,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 52.87,
- 'ave_edge_num': 320.09,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct2.zip',
- 'domain': 'social networks',
- },
- 'DBLP_v1': {
- 'database': 'tudataset',
- 'reference': '[26]',
- 'dataset_size': 19456,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 10.48,
- 'ave_edge_num': 19.65,
- 'node_labeled': True,
- 'edge_labeled': True,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DBLP_v1.zip',
- 'domain': 'social networks',
- },
- 'deezer_ego_nets': {
- 'database': 'tudataset',
- 'reference': '[30]',
- 'dataset_size': 9629,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 23.49,
- 'ave_edge_num': 65.25,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/deezer_ego_nets.zip',
- 'domain': 'social networks',
- },
- 'facebook_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 995,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 95.72,
- 'ave_edge_num': 269.01,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct1.zip',
- 'domain': 'social networks',
- },
- 'facebook_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 995,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 95.72,
- 'ave_edge_num': 269.01,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct2.zip',
- 'domain': 'social networks',
- },
- 'github_stargazers': {
- 'database': 'tudataset',
- 'reference': '[30]',
- 'dataset_size': 12725,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 113.79,
- 'ave_edge_num': 234.64,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/github_stargazers.zip',
- 'domain': 'social networks',
- },
- 'highschool_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 180,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 52.32,
- 'ave_edge_num': 544.81,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct1.zip',
- 'domain': 'social networks',
- },
- 'highschool_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 180,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 52.32,
- 'ave_edge_num': 544.81,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct2.zip',
- 'domain': 'social networks',
- },
- 'IMDB-BINARY': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 1000,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 19.77,
- 'ave_edge_num': 96.53,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': '',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-BINARY.zip',
- 'domain': 'social networks',
- },
- 'IMDB-MULTI': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 1500,
- 'class_number': 3,
- 'task_type': 'classification',
- 'ave_node_num': 13.0,
- 'ave_edge_num': 65.94,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': '',
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-MULTI.zip',
- 'domain': 'social networks',
- },
- 'infectious_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 200,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 50.0,
- 'ave_edge_num': 459.72,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct1.zip',
- 'domain': 'social networks',
- },
- 'infectious_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 200,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 50.0,
- 'ave_edge_num': 459.72,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct2.zip',
- 'domain': 'social networks',
- },
- 'mit_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 97,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 20.0,
- 'ave_edge_num': 1469.15,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct1.zip',
- 'domain': 'social networks',
- },
- 'mit_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 97,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 20.0,
- 'ave_edge_num': 1469.15,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct2.zip',
- 'domain': 'social networks',
- },
- 'REDDIT-BINARY': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 2000,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 429.63,
- 'ave_edge_num': 497.75,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-BINARY.zip',
- 'domain': 'social networks',
- },
- 'REDDIT-MULTI-5K': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 4999,
- 'class_number': 5,
- 'task_type': 'classification',
- 'ave_node_num': 508.52,
- 'ave_edge_num': 594.87,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-5K.zip',
- 'domain': 'social networks',
- },
- 'REDDIT-MULTI-12K': {
- 'database': 'tudataset',
- 'reference': '[14]',
- 'dataset_size': 11929,
- 'class_number': 11,
- 'task_type': 'classification',
- 'ave_node_num': 391.41,
- 'ave_edge_num': 456.89,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-12K.zip',
- 'domain': 'social networks',
- },
- 'reddit_threads': {
- 'database': 'tudataset',
- 'reference': '[30]',
- 'dataset_size': 203088,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 23.93,
- 'ave_edge_num': 24.99,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/reddit_threads.zip',
- 'domain': 'social networks',
- },
- 'tumblr_ct1': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 373,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 53.11,
- 'ave_edge_num': 199.78,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct1.zip',
- 'domain': 'social networks',
- },
- 'tumblr_ct2': {
- 'database': 'tudataset',
- 'reference': '[32]',
- 'dataset_size': 373,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 53.11,
- 'ave_edge_num': 199.78,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 'temporal',
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct2.zip',
- 'domain': 'social networks',
- },
- 'twitch_egos': {
- 'database': 'tudataset',
- 'reference': '[30]',
- 'dataset_size': 127094,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 29.67,
- 'ave_edge_num': 86.59,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/twitch_egos.zip',
- 'domain': 'social networks',
- },
- 'TWITTER-Real-Graph-Partial': {
- 'database': 'tudataset',
- 'reference': '[26]',
- 'dataset_size': 144033,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 4.03,
- 'ave_edge_num': 4.98,
- 'node_labeled': True,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 1,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TWITTER-Real-Graph-Partial.zip',
- 'domain': 'social networks',
- },
-
- ### synthetic
- 'COLORS-3': {
- 'database': 'tudataset',
- 'reference': '[27]',
- 'dataset_size': 10500,
- 'class_number': 11,
- 'task_type': 'classification',
- 'ave_node_num': 61.31,
- 'ave_edge_num': 91.03,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 4,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLORS-3.zip',
- 'domain': 'synthetic',
- },
- 'SYNTHETIC': {
- 'database': 'tudataset',
- 'reference': '[3]',
- 'dataset_size': 300,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 100.0,
- 'ave_edge_num': 196.0,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 1,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETIC.zip',
- 'domain': 'synthetic',
- },
- 'SYNTHETICnew': {
- 'database': 'tudataset',
- 'reference': '[3,10]',
- 'dataset_size': 300,
- 'class_number': 2,
- 'task_type': 'classification',
- 'ave_node_num': 100.0,
- 'ave_edge_num': 196.25,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 1,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETICnew.zip',
- 'domain': 'synthetic',
- },
- 'Synthie': {
- 'database': 'tudataset',
- 'reference': '[21]',
- 'dataset_size': 400,
- 'class_number': 4,
- 'task_type': 'classification',
- 'ave_node_num': 95.0,
- 'ave_edge_num': 172.93,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 15,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Synthie.zip',
- 'domain': 'synthetic',
- },
- 'TRIANGLES': {
- 'database': 'tudataset',
- 'reference': '[27]',
- 'dataset_size': 45000,
- 'class_number': 10,
- 'task_type': 'classification',
- 'ave_node_num': 20.85,
- 'ave_edge_num': 32.74,
- 'node_labeled': False,
- 'edge_labeled': False,
- 'node_attr_dim': 0,
- 'geometry': None,
- 'edge_attr_dim': 0,
- 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TRIANGLES.zip',
- 'domain': 'synthetic',
- },
- }
-
-
# Single lookup table built from the GREYC, IAM and TUDataset metadata
# tables. They are merged in that order, so if a dataset name occurs in more
# than one table the entry from the later table is the one that is kept.
DATASET_META = dict(GREYC_META)
DATASET_META.update(IAM_META)
DATASET_META.update(TUDataset_META)
-
-
def list_of_databases():
    """Return the names of all known databases.

    Returns
    -------
    list
        A new list holding every item produced by iterating over the
        module-level ``DATABASES`` collection, in iteration order.
    """
    return list(DATABASES)
-
-
def list_of_datasets():
    """Return the names of all known datasets.

    Returns
    -------
    list
        A new list holding the keys of ``DATASET_META`` (the dataset names),
        in the mapping's iteration order.
    """
    return list(DATASET_META)
|