You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

metadata.py 65 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Tue Oct 20 14:25:49 2020
@author: ljia
"""
  7. DATABASES = {
  8. 'greyc': 'https://brunl01.users.greyc.fr/CHEMISTRY/',
  9. 'iam': 'https://iapr-tc15.greyc.fr/IAM/',
  10. 'tudataset': 'http://graphlearning.io/docs/datasets/',
  11. }
### -------- database greyc -------- ###
  13. GREYC_META = {
  14. 'ACE': {
  15. 'database': 'greyc',
  16. 'reference': None,
  17. 'dataset_size': 32,
  18. 'class_number': 2,
  19. 'task_type': 'classification',
  20. 'ave_node_num': 52,
  21. 'ave_edge_num': None,
  22. 'node_labeled': None,
  23. 'edge_labeled': None,
  24. 'node_attr_dim': None,
  25. 'geometry': None,
  26. 'edge_attr_dim': None,
  27. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ACEDataset.tar',
  28. 'domain': 'small molecules',
  29. 'train_valid_test': [],
  30. 'stereoisomerism': True,
  31. 'load_files': ['data.ds'],
  32. },
  33. 'Acyclic': {
  34. 'database': 'greyc',
  35. 'reference': None,
  36. 'dataset_size': 183,
  37. 'class_number': None,
  38. 'task_type': 'regression',
  39. 'ave_node_num': 8.15,
  40. 'ave_edge_num': 7.15,
  41. 'node_labeled': True,
  42. 'edge_labeled': False,
  43. 'node_attr_dim': 0,
  44. 'geometry': None,
  45. 'edge_attr_dim': 0,
  46. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/Acyclic.tar.gz',
  47. 'domain': 'small molecules',
  48. 'train_valid_test': None,
  49. 'stereoisomerism': False,
  50. 'load_files': ['dataset_bps.ds'],
  51. },
  52. 'AIDS_greyc': {
  53. 'database': 'greyc',
  54. 'reference': None,
  55. 'dataset_size': 2000,
  56. 'class_number': 2,
  57. 'task_type': 'classification',
  58. 'ave_node_num': 15.69,
  59. 'ave_edge_num': 16.20,
  60. 'node_labeled': True,
  61. 'edge_labeled': True,
  62. 'node_attr_dim': None,
  63. 'geometry': None,
  64. 'edge_attr_dim': None,
  65. 'url': 'https://iapr-tc15.greyc.fr/IAM/AIDS.zip',
  66. 'domain': 'small molecules',
  67. 'train_valid_test': ['data/train.cxl', 'data/valid.cxl', 'data/test.cxl',],
  68. 'stereoisomerism': False,
  69. 'load_files': ['data/'],
  70. },
  71. 'Alkane': {
  72. 'database': 'greyc',
  73. 'reference': None,
  74. 'dataset_size': 150,
  75. 'class_number': None,
  76. 'task_type': 'regression',
  77. 'ave_node_num': 8.87,
  78. 'ave_edge_num': 7.87,
  79. 'node_labeled': False,
  80. 'edge_labeled': False,
  81. 'node_attr_dim': 0,
  82. 'geometry': None,
  83. 'edge_attr_dim': 0,
  84. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/alkane_dataset.tar.gz',
  85. 'domain': 'small molecules',
  86. 'train_valid_test': None,
  87. 'stereoisomerism': False,
  88. 'load_files': ['dataset.ds', 'dataset_boiling_point_names.txt'],
  89. },
  90. 'Chiral': {
  91. 'database': 'greyc',
  92. 'reference': None,
  93. 'dataset_size': 35,
  94. 'class_number': None,
  95. 'task_type': 'regression',
  96. 'ave_node_num': 21.29,
  97. 'ave_edge_num': None,
  98. 'node_labeled': None,
  99. 'edge_labeled': None,
  100. 'node_attr_dim': None,
  101. 'geometry': None,
  102. 'edge_attr_dim': None,
  103. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetAcyclicChiral.tar',
  104. 'domain': 'small molecules',
  105. 'train_valid_test': [],
  106. 'stereoisomerism': True,
  107. 'load_files': ['data.txt'],
  108. 'extra_params': {'gformat': 'cml'}
  109. },
  110. 'MAO': {
  111. 'database': 'greyc',
  112. 'reference': None,
  113. 'dataset_size': 68,
  114. 'class_number': 2,
  115. 'task_type': 'classification',
  116. 'ave_node_num': 18.38,
  117. 'ave_edge_num': 19.63,
  118. 'node_labeled': True,
  119. 'edge_labeled': True,
  120. 'node_attr_dim': 0,
  121. 'geometry': None,
  122. 'edge_attr_dim': 0,
  123. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/mao.tgz',
  124. 'domain': 'small molecules',
  125. 'train_valid_test': None,
  126. 'stereoisomerism': False,
  127. 'load_files': ['dataset.ds'],
  128. },
  129. 'Monoterpenoides': {
  130. 'database': 'greyc',
  131. 'reference': None,
  132. 'dataset_size': 382,
  133. 'class_number': 10,
  134. 'task_type': 'classification',
  135. 'ave_node_num': 10,
  136. 'ave_edge_num': None,
  137. 'node_labeled': None,
  138. 'edge_labeled': None,
  139. 'node_attr_dim': None,
  140. 'geometry': None,
  141. 'edge_attr_dim': None,
  142. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/monoterpenoides.tar.gz',
  143. 'domain': 'small molecules',
  144. 'train_valid_test': None,
  145. 'stereoisomerism': False,
  146. 'load_files': ['dataset_10+.ds'],
  147. },
  148. 'PAH': {
  149. 'database': 'greyc',
  150. 'reference': None,
  151. 'dataset_size': 94,
  152. 'class_number': 2,
  153. 'task_type': 'classification',
  154. 'ave_node_num': 20.7,
  155. 'ave_edge_num': 24.43,
  156. 'node_labeled': False,
  157. 'edge_labeled': False,
  158. 'node_attr_dim': 0,
  159. 'geometry': None,
  160. 'edge_attr_dim': 0,
  161. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/PAH.tar.gz',
  162. 'domain': 'small molecules',
  163. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  164. 'stereoisomerism': False,
  165. 'load_files': [['trainset_0.ds', 'testset_0.ds']],
  166. },
  167. 'PTC': {
  168. 'database': 'greyc',
  169. 'reference': None,
  170. 'dataset_size': 416,
  171. 'class_number': None,
  172. 'task_type': 'classification',
  173. 'ave_node_num': 14.4,
  174. 'ave_edge_num': None,
  175. 'node_labeled': None,
  176. 'edge_labeled': None,
  177. 'node_attr_dim': None,
  178. 'geometry': None,
  179. 'edge_attr_dim': None,
  180. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/ptc.tgz',
  181. 'domain': 'small molecules',
  182. 'train_valid_test': None,
  183. 'stereoisomerism': False,
  184. 'load_files': [],
  185. 'extra_info': 'This dataset has test and train datasets. Select gender between mm, fm, mr, fr. \ndataloader = DataLoader(\'Ptc\',root = ..., option = \'mm\') \ntest,train = dataloader.dataset \nGs_test, y_test = test \nGs_train_, y_train = train',
  186. },
  187. 'Steroid': {
  188. 'database': 'greyc',
  189. 'reference': None,
  190. 'dataset_size': 64,
  191. 'class_number': None,
  192. 'task_type': 'regression',
  193. 'ave_node_num': 75.11,
  194. 'ave_edge_num': None,
  195. 'node_labeled': None,
  196. 'edge_labeled': None,
  197. 'node_attr_dim': None,
  198. 'geometry': None,
  199. 'edge_attr_dim': None,
  200. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/SteroidDataset.tar',
  201. 'domain': 'small molecules',
  202. 'train_valid_test': ['trainset_0.ds', None, 'testset_0.ds'],
  203. 'stereoisomerism': False,
  204. 'load_files': [],
  205. },
  206. 'Vitamin_D': {
  207. 'database': 'greyc',
  208. 'reference': None,
  209. 'dataset_size': 69,
  210. 'class_number': None,
  211. 'task_type': 'regression',
  212. 'ave_node_num': 76.91,
  213. 'ave_edge_num': None,
  214. 'node_labeled': None,
  215. 'edge_labeled': None,
  216. 'node_attr_dim': None,
  217. 'geometry': None,
  218. 'edge_attr_dim': None,
  219. 'url': 'https://brunl01.users.greyc.fr/CHEMISTRY/DatasetVitamin.tar',
  220. 'domain': 'small molecules',
  221. 'train_valid_test': [],
  222. 'stereoisomerism': True,
  223. 'load_files': [],
  224. },
  225. }
### -------- database iam -------- ###
# @todo: several datasets in this database are also included in TUDataset. However, they do not include train/valid/test sets.
  228. IAM_META = {
  229. 'GREC': {
  230. 'database': 'iam',
  231. 'reference': None,
  232. 'dataset_size': None,
  233. 'class_number': None,
  234. 'task_type': None,
  235. 'ave_node_num': None,
  236. 'ave_edge_num': None,
  237. 'node_labeled': None,
  238. 'edge_labeled': None,
  239. 'node_attr_dim': None,
  240. 'geometry': None,
  241. 'edge_attr_dim': None,
  242. 'url': 'https://iapr-tc15.greyc.fr/IAM/GREC.zip',
  243. 'domain': None,
  244. 'train_valid_test': ['data/test.cxl','data/train.cxl', 'data/valid.cxl'],
  245. 'load_files': [],
  246. },
  247. 'Web': {
  248. 'database': 'iam',
  249. 'reference': None,
  250. 'dataset_size': None,
  251. 'class_number': None,
  252. 'task_type': None,
  253. 'ave_node_num': None,
  254. 'ave_edge_num': None,
  255. 'node_labeled': None,
  256. 'edge_labeled': None,
  257. 'node_attr_dim': None,
  258. 'geometry': None,
  259. 'edge_attr_dim': None,
  260. 'url': 'https://iapr-tc15.greyc.fr/IAM/Web.zip',
  261. 'domain': None,
  262. 'train_valid_test': ['data/test.cxl', 'data/train.cxl', 'data/valid.cxl'],
  263. 'load_files': [],
  264. },
  265. }
  266. ### -------- database tudataset -------- ###
  267. TUDataset_META = {
  268. ### small molecules
  269. 'AIDS': {
  270. 'database': 'tudataset',
  271. 'reference': '[16,17]',
  272. 'dataset_size': 2000,
  273. 'class_number': 2,
  274. 'task_type': 'classification',
  275. 'ave_node_num': 15.69,
  276. 'ave_edge_num': 16.2,
  277. 'node_labeled': True,
  278. 'edge_labeled': True,
  279. 'node_attr_dim': 4,
  280. 'geometry': None,
  281. 'edge_attr_dim': 0,
  282. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/AIDS.zip',
  283. 'domain': 'small molecules',
  284. },
  285. 'alchemy_full': {
  286. 'database': 'tudataset',
  287. 'reference': '[29]',
  288. 'dataset_size': 202579,
  289. 'class_number': None,
  290. 'task_type': 'regression',
  291. 'ave_node_num': 10.1,
  292. 'ave_edge_num': 10.44,
  293. 'node_labeled': True,
  294. 'edge_labeled': True,
  295. 'node_attr_dim': 3,
  296. 'geometry': '3D, RI',
  297. 'edge_attr_dim': 0,
  298. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/alchemy_full.zip',
  299. 'domain': 'small molecules',
  300. },
  301. 'aspirin': {
  302. 'database': 'tudataset',
  303. 'reference': '[36]',
  304. 'dataset_size': 111763,
  305. 'class_number': None,
  306. 'task_type': 'regression',
  307. 'ave_node_num': 21.0,
  308. 'ave_edge_num': 151.52,
  309. 'node_labeled': True,
  310. 'edge_labeled': False,
  311. 'node_attr_dim': 6,
  312. 'geometry': '3D, RI',
  313. 'edge_attr_dim': 0,
  314. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/aspirin.zip',
  315. 'domain': 'small molecules',
  316. },
  317. 'benzene': {
  318. 'database': 'tudataset',
  319. 'reference': '[36]',
  320. 'dataset_size': 527984,
  321. 'class_number': None,
  322. 'task_type': 'regression',
  323. 'ave_node_num': 12.0,
  324. 'ave_edge_num': 64.94,
  325. 'node_labeled': True,
  326. 'edge_labeled': False,
  327. 'node_attr_dim': 6,
  328. 'geometry': '3D, RI',
  329. 'edge_attr_dim': 0,
  330. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/benzene.zip',
  331. 'domain': 'small molecules',
  332. },
  333. 'BZR': {
  334. 'database': 'tudataset',
  335. 'reference': '[7]',
  336. 'dataset_size': 405,
  337. 'class_number': 2,
  338. 'task_type': 'classification',
  339. 'ave_node_num': 35.75,
  340. 'ave_edge_num': 38.36,
  341. 'node_labeled': True,
  342. 'edge_labeled': False,
  343. 'node_attr_dim': 3,
  344. 'geometry': '3D, RI',
  345. 'edge_attr_dim': 0,
  346. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR.zip',
  347. 'domain': 'small molecules',
  348. },
  349. 'BZR_MD': {
  350. 'database': 'tudataset',
  351. 'reference': '[7,23]',
  352. 'dataset_size': 306,
  353. 'class_number': 2,
  354. 'task_type': 'classification',
  355. 'ave_node_num': 21.3,
  356. 'ave_edge_num': 225.06,
  357. 'node_labeled': True,
  358. 'edge_labeled': True,
  359. 'node_attr_dim': 0,
  360. 'geometry': None,
  361. 'edge_attr_dim': 1,
  362. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/BZR_MD.zip',
  363. 'domain': 'small molecules',
  364. },
  365. 'COX2': {
  366. 'database': 'tudataset',
  367. 'reference': '[7]',
  368. 'dataset_size': 467,
  369. 'class_number': 2,
  370. 'task_type': 'classification',
  371. 'ave_node_num': 41.22,
  372. 'ave_edge_num': 43.45,
  373. 'node_labeled': True,
  374. 'edge_labeled': False,
  375. 'node_attr_dim': 3,
  376. 'geometry': '3D, RI',
  377. 'edge_attr_dim': 0,
  378. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2.zip',
  379. 'domain': 'small molecules',
  380. },
  381. 'COX2_MD': {
  382. 'database': 'tudataset',
  383. 'reference': '[7,23]',
  384. 'dataset_size': 303,
  385. 'class_number': 2,
  386. 'task_type': 'classification',
  387. 'ave_node_num': 26.28,
  388. 'ave_edge_num': 335.12,
  389. 'node_labeled': True,
  390. 'edge_labeled': True,
  391. 'node_attr_dim': 0,
  392. 'geometry': None,
  393. 'edge_attr_dim': 1,
  394. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COX2_MD.zip',
  395. 'domain': 'small molecules',
  396. },
  397. 'DHFR': {
  398. 'database': 'tudataset',
  399. 'reference': '[7]',
  400. 'dataset_size': 467,
  401. 'class_number': 2,
  402. 'task_type': 'classification',
  403. 'ave_node_num': 42.43,
  404. 'ave_edge_num': 44.54,
  405. 'node_labeled': True,
  406. 'edge_labeled': False,
  407. 'node_attr_dim': 3,
  408. 'geometry': '3D, RI',
  409. 'edge_attr_dim': 0,
  410. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR.zip',
  411. 'domain': 'small molecules',
  412. },
  413. 'DHFR_MD': {
  414. 'database': 'tudataset',
  415. 'reference': '[7,23]',
  416. 'dataset_size': 393,
  417. 'class_number': 2,
  418. 'task_type': 'classification',
  419. 'ave_node_num': 23.87,
  420. 'ave_edge_num': 283.01,
  421. 'node_labeled': True,
  422. 'edge_labeled': True,
  423. 'node_attr_dim': 0,
  424. 'geometry': None,
  425. 'edge_attr_dim': 1,
  426. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DHFR_MD.zip',
  427. 'domain': 'small molecules',
  428. },
  429. 'ER_MD': {
  430. 'database': 'tudataset',
  431. 'reference': '[7,23]',
  432. 'dataset_size': 446,
  433. 'class_number': 2,
  434. 'task_type': 'classification',
  435. 'ave_node_num': 21.33,
  436. 'ave_edge_num': 234.85,
  437. 'node_labeled': True,
  438. 'edge_labeled': True,
  439. 'node_attr_dim': 0,
  440. 'geometry': None,
  441. 'edge_attr_dim': 1,
  442. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ER_MD.zip',
  443. 'domain': 'small molecules',
  444. },
  445. 'ethanol': {
  446. 'database': 'tudataset',
  447. 'reference': '[36]',
  448. 'dataset_size': 455093,
  449. 'class_number': None,
  450. 'task_type': 'regression',
  451. 'ave_node_num': 9.0,
  452. 'ave_edge_num': 36.0,
  453. 'node_labeled': True,
  454. 'edge_labeled': False,
  455. 'node_attr_dim': 6,
  456. 'geometry': '3D, RI',
  457. 'edge_attr_dim': 0,
  458. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ethanol.zip',
  459. 'domain': 'small molecules',
  460. },
  461. 'FRANKENSTEIN': {
  462. 'database': 'tudataset',
  463. 'reference': '[15]',
  464. 'dataset_size': 4337,
  465. 'class_number': 2,
  466. 'task_type': 'classification',
  467. 'ave_node_num': 16.9,
  468. 'ave_edge_num': 17.88,
  469. 'node_labeled': False,
  470. 'edge_labeled': False,
  471. 'node_attr_dim': 780,
  472. 'geometry': None,
  473. 'edge_attr_dim': 0,
  474. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FRANKENSTEIN.zip',
  475. 'domain': 'small molecules',
  476. },
  477. 'malonaldehyde': {
  478. 'database': 'tudataset',
  479. 'reference': '[36]',
  480. 'dataset_size': 893238,
  481. 'class_number': None,
  482. 'task_type': 'regression',
  483. 'ave_node_num': 9.0,
  484. 'ave_edge_num': 36.0,
  485. 'node_labeled': True,
  486. 'edge_labeled': False,
  487. 'node_attr_dim': 6,
  488. 'geometry': '3D, RI',
  489. 'edge_attr_dim': 0,
  490. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/malonaldehyde.zip',
  491. 'domain': 'small molecules',
  492. },
  493. 'MCF-7': {
  494. 'database': 'tudataset',
  495. 'reference': '[28]',
  496. 'dataset_size': 27770,
  497. 'class_number': 2,
  498. 'task_type': 'classification',
  499. 'ave_node_num': 26.39,
  500. 'ave_edge_num': 28.52,
  501. 'node_labeled': True,
  502. 'edge_labeled': True,
  503. 'node_attr_dim': 0,
  504. 'geometry': None,
  505. 'edge_attr_dim': 0,
  506. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7.zip',
  507. 'domain': 'small molecules',
  508. },
  509. 'MCF-7H': {
  510. 'database': 'tudataset',
  511. 'reference': '[28]',
  512. 'dataset_size': 27770,
  513. 'class_number': 2,
  514. 'task_type': 'classification',
  515. 'ave_node_num': 47.3,
  516. 'ave_edge_num': 49.43,
  517. 'node_labeled': True,
  518. 'edge_labeled': True,
  519. 'node_attr_dim': 0,
  520. 'geometry': None,
  521. 'edge_attr_dim': 0,
  522. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MCF-7H.zip',
  523. 'domain': 'small molecules',
  524. },
  525. 'MOLT-4': {
  526. 'database': 'tudataset',
  527. 'reference': '[28]',
  528. 'dataset_size': 39765,
  529. 'class_number': 2,
  530. 'task_type': 'classification',
  531. 'ave_node_num': 26.09,
  532. 'ave_edge_num': 28.13,
  533. 'node_labeled': True,
  534. 'edge_labeled': True,
  535. 'node_attr_dim': 0,
  536. 'geometry': None,
  537. 'edge_attr_dim': 0,
  538. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4.zip',
  539. 'domain': 'small molecules',
  540. },
  541. 'MOLT-4H': {
  542. 'database': 'tudataset',
  543. 'reference': '[28]',
  544. 'dataset_size': 39765,
  545. 'class_number': 2,
  546. 'task_type': 'classification',
  547. 'ave_node_num': 46.7,
  548. 'ave_edge_num': 48.73,
  549. 'node_labeled': True,
  550. 'edge_labeled': True,
  551. 'node_attr_dim': 0,
  552. 'geometry': None,
  553. 'edge_attr_dim': 0,
  554. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MOLT-4H.zip',
  555. 'domain': 'small molecules',
  556. },
  557. 'Mutagenicity': {
  558. 'database': 'tudataset',
  559. 'reference': '[16,20]',
  560. 'dataset_size': 4337,
  561. 'class_number': 2,
  562. 'task_type': 'classification',
  563. 'ave_node_num': 30.32,
  564. 'ave_edge_num': 30.77,
  565. 'node_labeled': True,
  566. 'edge_labeled': True,
  567. 'node_attr_dim': 0,
  568. 'geometry': None,
  569. 'edge_attr_dim': 0,
  570. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Mutagenicity.zip',
  571. 'domain': 'small molecules',
  572. },
  573. 'MUTAG': {
  574. 'database': 'tudataset',
  575. 'reference': '[1,23]',
  576. 'dataset_size': 188,
  577. 'class_number': 2,
  578. 'task_type': 'classification',
  579. 'ave_node_num': 17.93,
  580. 'ave_edge_num': 19.79,
  581. 'node_labeled': True,
  582. 'edge_labeled': True,
  583. 'node_attr_dim': 0,
  584. 'geometry': None,
  585. 'edge_attr_dim': 0,
  586. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MUTAG.zip',
  587. 'domain': 'small molecules',
  588. },
  589. 'naphthalene': {
  590. 'database': 'tudataset',
  591. 'reference': '[36]',
  592. 'dataset_size': 226256,
  593. 'class_number': None,
  594. 'task_type': 'regression',
  595. 'ave_node_num': 18.0,
  596. 'ave_edge_num': 127.37,
  597. 'node_labeled': True,
  598. 'edge_labeled': False,
  599. 'node_attr_dim': 6,
  600. 'geometry': '3D, RI',
  601. 'edge_attr_dim': 0,
  602. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/naphthalene.zip',
  603. 'domain': 'small molecules',
  604. },
  605. 'NCI1': {
  606. 'database': 'tudataset',
  607. 'reference': '[8,9,22]',
  608. 'dataset_size': 4110,
  609. 'class_number': 2,
  610. 'task_type': 'classification',
  611. 'ave_node_num': 29.87,
  612. 'ave_edge_num': 32.3,
  613. 'node_labeled': True,
  614. 'edge_labeled': False,
  615. 'node_attr_dim': 0,
  616. 'geometry': None,
  617. 'edge_attr_dim': 0,
  618. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI1.zip',
  619. 'domain': 'small molecules',
  620. },
  621. 'NCI109': {
  622. 'database': 'tudataset',
  623. 'reference': '[8,9,22]',
  624. 'dataset_size': 4127,
  625. 'class_number': 2,
  626. 'task_type': 'classification',
  627. 'ave_node_num': 29.68,
  628. 'ave_edge_num': 32.13,
  629. 'node_labeled': True,
  630. 'edge_labeled': False,
  631. 'node_attr_dim': 0,
  632. 'geometry': None,
  633. 'edge_attr_dim': 0,
  634. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI109.zip',
  635. 'domain': 'small molecules',
  636. },
  637. 'NCI-H23': {
  638. 'database': 'tudataset',
  639. 'reference': '[28]',
  640. 'dataset_size': 40353,
  641. 'class_number': 2,
  642. 'task_type': 'classification',
  643. 'ave_node_num': 26.07,
  644. 'ave_edge_num': 28.1,
  645. 'node_labeled': True,
  646. 'edge_labeled': True,
  647. 'node_attr_dim': 0,
  648. 'geometry': None,
  649. 'edge_attr_dim': 0,
  650. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23.zip',
  651. 'domain': 'small molecules',
  652. },
  653. 'NCI-H23H': {
  654. 'database': 'tudataset',
  655. 'reference': '[28]',
  656. 'dataset_size': 40353,
  657. 'class_number': 2,
  658. 'task_type': 'classification',
  659. 'ave_node_num': 46.67,
  660. 'ave_edge_num': 48.69,
  661. 'node_labeled': True,
  662. 'edge_labeled': True,
  663. 'node_attr_dim': 0,
  664. 'geometry': None,
  665. 'edge_attr_dim': 0,
  666. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/NCI-H23H.zip',
  667. 'domain': 'small molecules',
  668. },
  669. 'OVCAR-8': {
  670. 'database': 'tudataset',
  671. 'reference': '[28]',
  672. 'dataset_size': 40516,
  673. 'class_number': 2,
  674. 'task_type': 'classification',
  675. 'ave_node_num': 26.07,
  676. 'ave_edge_num': 28.1,
  677. 'node_labeled': True,
  678. 'edge_labeled': True,
  679. 'node_attr_dim': 0,
  680. 'geometry': None,
  681. 'edge_attr_dim': 0,
  682. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8.zip',
  683. 'domain': 'small molecules',
  684. },
  685. 'OVCAR-8H': {
  686. 'database': 'tudataset',
  687. 'reference': '[28]',
  688. 'dataset_size': 40516,
  689. 'class_number': 2,
  690. 'task_type': 'classification',
  691. 'ave_node_num': 46.67,
  692. 'ave_edge_num': 48.7,
  693. 'node_labeled': True,
  694. 'edge_labeled': True,
  695. 'node_attr_dim': 0,
  696. 'geometry': None,
  697. 'edge_attr_dim': 0,
  698. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OVCAR-8H.zip',
  699. 'domain': 'small molecules',
  700. },
  701. 'P388': {
  702. 'database': 'tudataset',
  703. 'reference': '[28]',
  704. 'dataset_size': 41472,
  705. 'class_number': 2,
  706. 'task_type': 'classification',
  707. 'ave_node_num': 22.11,
  708. 'ave_edge_num': 23.55,
  709. 'node_labeled': True,
  710. 'edge_labeled': True,
  711. 'node_attr_dim': 0,
  712. 'geometry': None,
  713. 'edge_attr_dim': 0,
  714. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388.zip',
  715. 'domain': 'small molecules',
  716. },
  717. 'P388H': {
  718. 'database': 'tudataset',
  719. 'reference': '[28]',
  720. 'dataset_size': 41472,
  721. 'class_number': 2,
  722. 'task_type': 'classification',
  723. 'ave_node_num': 40.44,
  724. 'ave_edge_num': 41.88,
  725. 'node_labeled': True,
  726. 'edge_labeled': True,
  727. 'node_attr_dim': 0,
  728. 'geometry': None,
  729. 'edge_attr_dim': 0,
  730. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/P388H.zip',
  731. 'domain': 'small molecules',
  732. },
  733. 'PC-3': {
  734. 'database': 'tudataset',
  735. 'reference': '[28]',
  736. 'dataset_size': 27509,
  737. 'class_number': 2,
  738. 'task_type': 'classification',
  739. 'ave_node_num': 26.35,
  740. 'ave_edge_num': 28.49,
  741. 'node_labeled': True,
  742. 'edge_labeled': True,
  743. 'node_attr_dim': 0,
  744. 'geometry': None,
  745. 'edge_attr_dim': 0,
  746. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3.zip',
  747. 'domain': 'small molecules',
  748. },
  749. 'PC-3H': {
  750. 'database': 'tudataset',
  751. 'reference': '[28]',
  752. 'dataset_size': 27509,
  753. 'class_number': 2,
  754. 'task_type': 'classification',
  755. 'ave_node_num': 47.19,
  756. 'ave_edge_num': 49.32,
  757. 'node_labeled': True,
  758. 'edge_labeled': True,
  759. 'node_attr_dim': 0,
  760. 'geometry': None,
  761. 'edge_attr_dim': 0,
  762. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PC-3H.zip',
  763. 'domain': 'small molecules',
  764. },
  765. 'PTC_FM': {
  766. 'database': 'tudataset',
  767. 'reference': '[2,23]',
  768. 'dataset_size': 349,
  769. 'class_number': 2,
  770. 'task_type': 'classification',
  771. 'ave_node_num': 14.11,
  772. 'ave_edge_num': 14.48,
  773. 'node_labeled': True,
  774. 'edge_labeled': True,
  775. 'node_attr_dim': 0,
  776. 'geometry': None,
  777. 'edge_attr_dim': 0,
  778. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FM.zip',
  779. 'domain': 'small molecules',
  780. },
  781. 'PTC_FR': {
  782. 'database': 'tudataset',
  783. 'reference': '[2,23]',
  784. 'dataset_size': 351,
  785. 'class_number': 2,
  786. 'task_type': 'classification',
  787. 'ave_node_num': 14.56,
  788. 'ave_edge_num': 15.0,
  789. 'node_labeled': True,
  790. 'edge_labeled': True,
  791. 'node_attr_dim': 0,
  792. 'geometry': None,
  793. 'edge_attr_dim': 0,
  794. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_FR.zip',
  795. 'domain': 'small molecules',
  796. },
  797. 'PTC_MM': {
  798. 'database': 'tudataset',
  799. 'reference': '[2,23]',
  800. 'dataset_size': 336,
  801. 'class_number': 2,
  802. 'task_type': 'classification',
  803. 'ave_node_num': 13.97,
  804. 'ave_edge_num': 14.32,
  805. 'node_labeled': True,
  806. 'edge_labeled': True,
  807. 'node_attr_dim': 0,
  808. 'geometry': None,
  809. 'edge_attr_dim': 0,
  810. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MM.zip',
  811. 'domain': 'small molecules',
  812. },
  813. 'PTC_MR': {
  814. 'database': 'tudataset',
  815. 'reference': '[2,23]',
  816. 'dataset_size': 344,
  817. 'class_number': 2,
  818. 'task_type': 'classification',
  819. 'ave_node_num': 14.29,
  820. 'ave_edge_num': 14.69,
  821. 'node_labeled': True,
  822. 'edge_labeled': True,
  823. 'node_attr_dim': 0,
  824. 'geometry': None,
  825. 'edge_attr_dim': 0,
  826. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PTC_MR.zip',
  827. 'domain': 'small molecules',
  828. },
  829. 'QM9': {
  830. 'database': 'tudataset',
  831. 'reference': '[33,34,35]',
  832. 'dataset_size': 129433,
  833. 'class_number': None,
  834. 'task_type': 'regression',
  835. 'ave_node_num': 18.03,
  836. 'ave_edge_num': 18.63,
  837. 'node_labeled': False,
  838. 'edge_labeled': False,
  839. 'node_attr_dim': 16,
  840. 'geometry': '3D, RI',
  841. 'edge_attr_dim': 4,
  842. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/QM9.zip',
  843. 'domain': 'small molecules',
  844. },
  845. 'salicylic_acid': {
  846. 'database': 'tudataset',
  847. 'reference': '[36]',
  848. 'dataset_size': 220232,
  849. 'class_number': None,
  850. 'task_type': 'regression',
  851. 'ave_node_num': 16.0,
  852. 'ave_edge_num': 104.13,
  853. 'node_labeled': True,
  854. 'edge_labeled': False,
  855. 'node_attr_dim': 6,
  856. 'geometry': '3D, RI',
  857. 'edge_attr_dim': 0,
  858. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/salicylic_acid.zip',
  859. 'domain': 'small molecules',
  860. },
  861. 'SF-295': {
  862. 'database': 'tudataset',
  863. 'reference': '[28]',
  864. 'dataset_size': 40271,
  865. 'class_number': 2,
  866. 'task_type': 'classification',
  867. 'ave_node_num': 26.06,
  868. 'ave_edge_num': 28.08,
  869. 'node_labeled': True,
  870. 'edge_labeled': True,
  871. 'node_attr_dim': 0,
  872. 'geometry': None,
  873. 'edge_attr_dim': 0,
  874. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295.zip',
  875. 'domain': 'small molecules',
  876. },
  877. 'SF-295H': {
  878. 'database': 'tudataset',
  879. 'reference': '[28]',
  880. 'dataset_size': 40271,
  881. 'class_number': 2,
  882. 'task_type': 'classification',
  883. 'ave_node_num': 46.65,
  884. 'ave_edge_num': 48.68,
  885. 'node_labeled': True,
  886. 'edge_labeled': True,
  887. 'node_attr_dim': 0,
  888. 'geometry': None,
  889. 'edge_attr_dim': 0,
  890. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SF-295H.zip',
  891. 'domain': 'small molecules',
  892. },
  893. 'SN12C': {
  894. 'database': 'tudataset',
  895. 'reference': '[28]',
  896. 'dataset_size': 40004,
  897. 'class_number': 2,
  898. 'task_type': 'classification',
  899. 'ave_node_num': 26.08,
  900. 'ave_edge_num': 28.11,
  901. 'node_labeled': True,
  902. 'edge_labeled': True,
  903. 'node_attr_dim': 0,
  904. 'geometry': None,
  905. 'edge_attr_dim': 0,
  906. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12C.zip',
  907. 'domain': 'small molecules',
  908. },
  909. 'SN12CH': {
  910. 'database': 'tudataset',
  911. 'reference': '[28]',
  912. 'dataset_size': 40004,
  913. 'class_number': 2,
  914. 'task_type': 'classification',
  915. 'ave_node_num': 46.69,
  916. 'ave_edge_num': 48.71,
  917. 'node_labeled': True,
  918. 'edge_labeled': True,
  919. 'node_attr_dim': 0,
  920. 'geometry': None,
  921. 'edge_attr_dim': 0,
  922. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SN12CH.zip',
  923. 'domain': 'small molecules',
  924. },
  925. 'SW-620': {
  926. 'database': 'tudataset',
  927. 'reference': '[28]',
  928. 'dataset_size': 40532,
  929. 'class_number': 2,
  930. 'task_type': 'classification',
  931. 'ave_node_num': 26.05,
  932. 'ave_edge_num': 28.08,
  933. 'node_labeled': True,
  934. 'edge_labeled': True,
  935. 'node_attr_dim': 0,
  936. 'geometry': None,
  937. 'edge_attr_dim': 0,
  938. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620.zip',
  939. 'domain': 'small molecules',
  940. },
  941. 'SW-620H': {
  942. 'database': 'tudataset',
  943. 'reference': '[28]',
  944. 'dataset_size': 40532,
  945. 'class_number': 2,
  946. 'task_type': 'classification',
  947. 'ave_node_num': 46.62,
  948. 'ave_edge_num': 48.65,
  949. 'node_labeled': True,
  950. 'edge_labeled': True,
  951. 'node_attr_dim': 0,
  952. 'geometry': None,
  953. 'edge_attr_dim': 0,
  954. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SW-620H.zip',
  955. 'domain': 'small molecules',
  956. },
  957. 'toluene': {
  958. 'database': 'tudataset',
  959. 'reference': '[36]',
  960. 'dataset_size': 342791,
  961. 'class_number': None,
  962. 'task_type': 'regression',
  963. 'ave_node_num': 15.0,
  964. 'ave_edge_num': 96.15,
  965. 'node_labeled': True,
  966. 'edge_labeled': False,
  967. 'node_attr_dim': 6,
  968. 'geometry': '3D, RI',
  969. 'edge_attr_dim': 0,
  970. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/toluene.zip',
  971. 'domain': 'small molecules',
  972. },
  973. 'Tox21_AhR_training': {
  974. 'database': 'tudataset',
  975. 'reference': '[24]',
  976. 'dataset_size': 8169,
  977. 'class_number': 2,
  978. 'task_type': 'classification',
  979. 'ave_node_num': 18.09,
  980. 'ave_edge_num': 18.5,
  981. 'node_labeled': True,
  982. 'edge_labeled': True,
  983. 'node_attr_dim': 0,
  984. 'geometry': None,
  985. 'edge_attr_dim': 0,
  986. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_training.zip',
  987. 'domain': 'small molecules',
  988. },
  989. 'Tox21_AhR_testing': {
  990. 'database': 'tudataset',
  991. 'reference': '[24]',
  992. 'dataset_size': 272,
  993. 'class_number': 2,
  994. 'task_type': 'classification',
  995. 'ave_node_num': 22.13,
  996. 'ave_edge_num': 23.05,
  997. 'node_labeled': True,
  998. 'edge_labeled': True,
  999. 'node_attr_dim': 0,
  1000. 'geometry': None,
  1001. 'edge_attr_dim': 0,
  1002. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_testing.zip',
  1003. 'domain': 'small molecules',
  1004. },
  1005. 'Tox21_AhR_evaluation': {
  1006. 'database': 'tudataset',
  1007. 'reference': '[24]',
  1008. 'dataset_size': 607,
  1009. 'class_number': 2,
  1010. 'task_type': 'classification',
  1011. 'ave_node_num': 17.64,
  1012. 'ave_edge_num': 18.06,
  1013. 'node_labeled': True,
  1014. 'edge_labeled': True,
  1015. 'node_attr_dim': 0,
  1016. 'geometry': None,
  1017. 'edge_attr_dim': 0,
  1018. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AhR_evaluation.zip',
  1019. 'domain': 'small molecules',
  1020. },
  1021. 'Tox21_AR_training': {
  1022. 'database': 'tudataset',
  1023. 'reference': '[24]',
  1024. 'dataset_size': 9362,
  1025. 'class_number': 2,
  1026. 'task_type': 'classification',
  1027. 'ave_node_num': 18.39,
  1028. 'ave_edge_num': 18.84,
  1029. 'node_labeled': True,
  1030. 'edge_labeled': True,
  1031. 'node_attr_dim': 0,
  1032. 'geometry': None,
  1033. 'edge_attr_dim': 0,
  1034. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_training.zip',
  1035. 'domain': 'small molecules',
  1036. },
  1037. 'Tox21_AR_testing': {
  1038. 'database': 'tudataset',
  1039. 'reference': '[24]',
  1040. 'dataset_size': 292,
  1041. 'class_number': 2,
  1042. 'task_type': 'classification',
  1043. 'ave_node_num': 22.35,
  1044. 'ave_edge_num': 23.32,
  1045. 'node_labeled': True,
  1046. 'edge_labeled': True,
  1047. 'node_attr_dim': 0,
  1048. 'geometry': None,
  1049. 'edge_attr_dim': 0,
  1050. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_testing.zip',
  1051. 'domain': 'small molecules',
  1052. },
  1053. 'Tox21_AR_evaluation': {
  1054. 'database': 'tudataset',
  1055. 'reference': '[24]',
  1056. 'dataset_size': 585,
  1057. 'class_number': 2,
  1058. 'task_type': 'classification',
  1059. 'ave_node_num': 17.99,
  1060. 'ave_edge_num': 18.45,
  1061. 'node_labeled': True,
  1062. 'edge_labeled': True,
  1063. 'node_attr_dim': 0,
  1064. 'geometry': None,
  1065. 'edge_attr_dim': 0,
  1066. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR_evaluation.zip',
  1067. 'domain': 'small molecules',
  1068. },
  1069. 'Tox21_AR-LBD_training': {
  1070. 'database': 'tudataset',
  1071. 'reference': '[24]',
  1072. 'dataset_size': 8599,
  1073. 'class_number': 2,
  1074. 'task_type': 'classification',
  1075. 'ave_node_num': 17.77,
  1076. 'ave_edge_num': 18.16,
  1077. 'node_labeled': True,
  1078. 'edge_labeled': True,
  1079. 'node_attr_dim': 0,
  1080. 'geometry': None,
  1081. 'edge_attr_dim': 0,
  1082. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_training.zip',
  1083. 'domain': 'small molecules',
  1084. },
  1085. 'Tox21_AR-LBD_testing': {
  1086. 'database': 'tudataset',
  1087. 'reference': '[24]',
  1088. 'dataset_size': 253,
  1089. 'class_number': 2,
  1090. 'task_type': 'classification',
  1091. 'ave_node_num': 21.85,
  1092. 'ave_edge_num': 22.73,
  1093. 'node_labeled': True,
  1094. 'edge_labeled': True,
  1095. 'node_attr_dim': 0,
  1096. 'geometry': None,
  1097. 'edge_attr_dim': 0,
  1098. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_testing.zip',
  1099. 'domain': 'small molecules',
  1100. },
  1101. 'Tox21_AR-LBD_evaluation': {
  1102. 'database': 'tudataset',
  1103. 'reference': '[24]',
  1104. 'dataset_size': 580,
  1105. 'class_number': 2,
  1106. 'task_type': 'classification',
  1107. 'ave_node_num': 17.09,
  1108. 'ave_edge_num': 17.42,
  1109. 'node_labeled': True,
  1110. 'edge_labeled': True,
  1111. 'node_attr_dim': 0,
  1112. 'geometry': None,
  1113. 'edge_attr_dim': 0,
  1114. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_AR-LBD_evaluation.zip',
  1115. 'domain': 'small molecules',
  1116. },
  1117. 'Tox21_ARE_training': {
  1118. 'database': 'tudataset',
  1119. 'reference': '[24]',
  1120. 'dataset_size': 7167,
  1121. 'class_number': 2,
  1122. 'task_type': 'classification',
  1123. 'ave_node_num': 16.28,
  1124. 'ave_edge_num': 16.52,
  1125. 'node_labeled': True,
  1126. 'edge_labeled': True,
  1127. 'node_attr_dim': 0,
  1128. 'geometry': None,
  1129. 'edge_attr_dim': 0,
  1130. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_training.zip',
  1131. 'domain': 'small molecules',
  1132. },
  1133. 'Tox21_ARE_testing': {
  1134. 'database': 'tudataset',
  1135. 'reference': '[24]',
  1136. 'dataset_size': 234,
  1137. 'class_number': 2,
  1138. 'task_type': 'classification',
  1139. 'ave_node_num': 21.99,
  1140. 'ave_edge_num': 22.91,
  1141. 'node_labeled': True,
  1142. 'edge_labeled': True,
  1143. 'node_attr_dim': 0,
  1144. 'geometry': None,
  1145. 'edge_attr_dim': 0,
  1146. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_testing.zip',
  1147. 'domain': 'small molecules',
  1148. },
  1149. 'Tox21_ARE_evaluation': {
  1150. 'database': 'tudataset',
  1151. 'reference': '[24]',
  1152. 'dataset_size': 552,
  1153. 'class_number': 2,
  1154. 'task_type': 'classification',
  1155. 'ave_node_num': 17.01,
  1156. 'ave_edge_num': 17.33,
  1157. 'node_labeled': True,
  1158. 'edge_labeled': True,
  1159. 'node_attr_dim': 0,
  1160. 'geometry': None,
  1161. 'edge_attr_dim': 0,
  1162. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ARE_evaluation.zip',
  1163. 'domain': 'small molecules',
  1164. },
  1165. 'Tox21_aromatase_training': {
  1166. 'database': 'tudataset',
  1167. 'reference': '[24]',
  1168. 'dataset_size': 7226,
  1169. 'class_number': 2,
  1170. 'task_type': 'classification',
  1171. 'ave_node_num': 17.5,
  1172. 'ave_edge_num': 17.79,
  1173. 'node_labeled': True,
  1174. 'edge_labeled': True,
  1175. 'node_attr_dim': 0,
  1176. 'geometry': None,
  1177. 'edge_attr_dim': 0,
  1178. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_training.zip',
  1179. 'domain': 'small molecules',
  1180. },
  1181. 'Tox21_aromatase_testing': {
  1182. 'database': 'tudataset',
  1183. 'reference': '[24]',
  1184. 'dataset_size': 214,
  1185. 'class_number': 2,
  1186. 'task_type': 'classification',
  1187. 'ave_node_num': 21.65,
  1188. 'ave_edge_num': 22.36,
  1189. 'node_labeled': True,
  1190. 'edge_labeled': True,
  1191. 'node_attr_dim': 0,
  1192. 'geometry': None,
  1193. 'edge_attr_dim': 0,
  1194. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_testing.zip',
  1195. 'domain': 'small molecules',
  1196. },
  1197. 'Tox21_aromatase_evaluation': {
  1198. 'database': 'tudataset',
  1199. 'reference': '[24]',
  1200. 'dataset_size': 528,
  1201. 'class_number': 2,
  1202. 'task_type': 'classification',
  1203. 'ave_node_num': 16.74,
  1204. 'ave_edge_num': 16.99,
  1205. 'node_labeled': True,
  1206. 'edge_labeled': True,
  1207. 'node_attr_dim': 0,
  1208. 'geometry': None,
  1209. 'edge_attr_dim': 0,
  1210. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_aromatase_evaluation.zip',
  1211. 'domain': 'small molecules',
  1212. },
  1213. 'Tox21_ATAD5_training': {
  1214. 'database': 'tudataset',
  1215. 'reference': '[24]',
  1216. 'dataset_size': 9091,
  1217. 'class_number': 2,
  1218. 'task_type': 'classification',
  1219. 'ave_node_num': 17.89,
  1220. 'ave_edge_num': 18.3,
  1221. 'node_labeled': True,
  1222. 'edge_labeled': True,
  1223. 'node_attr_dim': 0,
  1224. 'geometry': None,
  1225. 'edge_attr_dim': 0,
  1226. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_training.zip',
  1227. 'domain': 'small molecules',
  1228. },
  1229. 'Tox21_ATAD5_testing': {
  1230. 'database': 'tudataset',
  1231. 'reference': '[24]',
  1232. 'dataset_size': 272,
  1233. 'class_number': 2,
  1234. 'task_type': 'classification',
  1235. 'ave_node_num': 21.99,
  1236. 'ave_edge_num': 22.89,
  1237. 'node_labeled': True,
  1238. 'edge_labeled': True,
  1239. 'node_attr_dim': 0,
  1240. 'geometry': None,
  1241. 'edge_attr_dim': 0,
  1242. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_testing.zip',
  1243. 'domain': 'small molecules',
  1244. },
  1245. 'Tox21_ATAD5_evaluation': {
  1246. 'database': 'tudataset',
  1247. 'reference': '[24]',
  1248. 'dataset_size': 619,
  1249. 'class_number': 2,
  1250. 'task_type': 'classification',
  1251. 'ave_node_num': 17.68,
  1252. 'ave_edge_num': 18.11,
  1253. 'node_labeled': True,
  1254. 'edge_labeled': True,
  1255. 'node_attr_dim': 0,
  1256. 'geometry': None,
  1257. 'edge_attr_dim': 0,
  1258. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ATAD5_evaluation.zip',
  1259. 'domain': 'small molecules',
  1260. },
  1261. 'Tox21_ER_training': {
  1262. 'database': 'tudataset',
  1263. 'reference': '[24]',
  1264. 'dataset_size': 7697,
  1265. 'class_number': 2,
  1266. 'task_type': 'classification',
  1267. 'ave_node_num': 17.58,
  1268. 'ave_edge_num': 17.94,
  1269. 'node_labeled': True,
  1270. 'edge_labeled': True,
  1271. 'node_attr_dim': 0,
  1272. 'geometry': None,
  1273. 'edge_attr_dim': 0,
  1274. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_training.zip',
  1275. 'domain': 'small molecules',
  1276. },
  1277. 'Tox21_ER_testing': {
  1278. 'database': 'tudataset',
  1279. 'reference': '[24]',
  1280. 'dataset_size': 265,
  1281. 'class_number': 2,
  1282. 'task_type': 'classification',
  1283. 'ave_node_num': 22.16,
  1284. 'ave_edge_num': 23.13,
  1285. 'node_labeled': True,
  1286. 'edge_labeled': True,
  1287. 'node_attr_dim': 0,
  1288. 'geometry': None,
  1289. 'edge_attr_dim': 0,
  1290. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_testing.zip',
  1291. 'domain': 'small molecules',
  1292. },
  1293. 'Tox21_ER_evaluation': {
  1294. 'database': 'tudataset',
  1295. 'reference': '[24]',
  1296. 'dataset_size': 515,
  1297. 'class_number': 2,
  1298. 'task_type': 'classification',
  1299. 'ave_node_num': 17.66,
  1300. 'ave_edge_num': 18.1,
  1301. 'node_labeled': True,
  1302. 'edge_labeled': True,
  1303. 'node_attr_dim': 0,
  1304. 'geometry': None,
  1305. 'edge_attr_dim': 0,
  1306. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER_evaluation.zip',
  1307. 'domain': 'small molecules',
  1308. },
  1309. 'Tox21_ER-LBD_training': {
  1310. 'database': 'tudataset',
  1311. 'reference': '[24]',
  1312. 'dataset_size': 8753,
  1313. 'class_number': 2,
  1314. 'task_type': 'classification',
  1315. 'ave_node_num': 18.06,
  1316. 'ave_edge_num': 18.47,
  1317. 'node_labeled': True,
  1318. 'edge_labeled': True,
  1319. 'node_attr_dim': 0,
  1320. 'geometry': None,
  1321. 'edge_attr_dim': 0,
  1322. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_training.zip',
  1323. 'domain': 'small molecules',
  1324. },
  1325. 'Tox21_ER-LBD_testing': {
  1326. 'database': 'tudataset',
  1327. 'reference': '[24]',
  1328. 'dataset_size': 287,
  1329. 'class_number': 2,
  1330. 'task_type': 'classification',
  1331. 'ave_node_num': 22.28,
  1332. 'ave_edge_num': 23.23,
  1333. 'node_labeled': True,
  1334. 'edge_labeled': True,
  1335. 'node_attr_dim': 0,
  1336. 'geometry': None,
  1337. 'edge_attr_dim': 0,
  1338. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_testing.zip',
  1339. 'domain': 'small molecules',
  1340. },
  1341. 'Tox21_ER-LBD_evaluation': {
  1342. 'database': 'tudataset',
  1343. 'reference': '[24]',
  1344. 'dataset_size': 599,
  1345. 'class_number': 2,
  1346. 'task_type': 'classification',
  1347. 'ave_node_num': 17.75,
  1348. 'ave_edge_num': 18.17,
  1349. 'node_labeled': True,
  1350. 'edge_labeled': True,
  1351. 'node_attr_dim': 0,
  1352. 'geometry': None,
  1353. 'edge_attr_dim': 0,
  1354. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_ER-LBD_evaluation.zip',
  1355. 'domain': 'small molecules',
  1356. },
  1357. 'Tox21_HSE_training': {
  1358. 'database': 'tudataset',
  1359. 'reference': '[24]',
  1360. 'dataset_size': 8150,
  1361. 'class_number': 2,
  1362. 'task_type': 'classification',
  1363. 'ave_node_num': 16.72,
  1364. 'ave_edge_num': 17.04,
  1365. 'node_labeled': True,
  1366. 'edge_labeled': True,
  1367. 'node_attr_dim': 0,
  1368. 'geometry': None,
  1369. 'edge_attr_dim': 0,
  1370. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_training.zip',
  1371. 'domain': 'small molecules',
  1372. },
  1373. 'Tox21_HSE_testing': {
  1374. 'database': 'tudataset',
  1375. 'reference': '[24]',
  1376. 'dataset_size': 267,
  1377. 'class_number': 2,
  1378. 'task_type': 'classification',
  1379. 'ave_node_num': 22.07,
  1380. 'ave_edge_num': 23.0,
  1381. 'node_labeled': True,
  1382. 'edge_labeled': True,
  1383. 'node_attr_dim': 0,
  1384. 'geometry': None,
  1385. 'edge_attr_dim': 0,
  1386. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_testing.zip',
  1387. 'domain': 'small molecules',
  1388. },
  1389. 'Tox21_HSE_evaluation': {
  1390. 'database': 'tudataset',
  1391. 'reference': '[24]',
  1392. 'dataset_size': 607,
  1393. 'class_number': 2,
  1394. 'task_type': 'classification',
  1395. 'ave_node_num': 17.61,
  1396. 'ave_edge_num': 18.01,
  1397. 'node_labeled': True,
  1398. 'edge_labeled': True,
  1399. 'node_attr_dim': 0,
  1400. 'geometry': None,
  1401. 'edge_attr_dim': 0,
  1402. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_HSE_evaluation.zip',
  1403. 'domain': 'small molecules',
  1404. },
  1405. 'Tox21_MMP_training': {
  1406. 'database': 'tudataset',
  1407. 'reference': '[24]',
  1408. 'dataset_size': 7320,
  1409. 'class_number': 2,
  1410. 'task_type': 'classification',
  1411. 'ave_node_num': 17.49,
  1412. 'ave_edge_num': 17.83,
  1413. 'node_labeled': True,
  1414. 'edge_labeled': True,
  1415. 'node_attr_dim': 0,
  1416. 'geometry': None,
  1417. 'edge_attr_dim': 0,
  1418. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_training.zip',
  1419. 'domain': 'small molecules',
  1420. },
  1421. 'Tox21_MMP_testing': {
  1422. 'database': 'tudataset',
  1423. 'reference': '[24]',
  1424. 'dataset_size': 238,
  1425. 'class_number': 2,
  1426. 'task_type': 'classification',
  1427. 'ave_node_num': 21.68,
  1428. 'ave_edge_num': 22.55,
  1429. 'node_labeled': True,
  1430. 'edge_labeled': True,
  1431. 'node_attr_dim': 0,
  1432. 'geometry': None,
  1433. 'edge_attr_dim': 0,
  1434. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_testing.zip',
  1435. 'domain': 'small molecules',
  1436. },
  1437. 'Tox21_MMP_evaluation': {
  1438. 'database': 'tudataset',
  1439. 'reference': '[24]',
  1440. 'dataset_size': 541,
  1441. 'class_number': 2,
  1442. 'task_type': 'classification',
  1443. 'ave_node_num': 16.67,
  1444. 'ave_edge_num': 16.88,
  1445. 'node_labeled': True,
  1446. 'edge_labeled': True,
  1447. 'node_attr_dim': 0,
  1448. 'geometry': None,
  1449. 'edge_attr_dim': 0,
  1450. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_MMP_evaluation.zip',
  1451. 'domain': 'small molecules',
  1452. },
  1453. 'Tox21_p53_training': {
  1454. 'database': 'tudataset',
  1455. 'reference': '[24]',
  1456. 'dataset_size': 8634,
  1457. 'class_number': 2,
  1458. 'task_type': 'classification',
  1459. 'ave_node_num': 17.79,
  1460. 'ave_edge_num': 18.19,
  1461. 'node_labeled': True,
  1462. 'edge_labeled': True,
  1463. 'node_attr_dim': 0,
  1464. 'geometry': None,
  1465. 'edge_attr_dim': 0,
  1466. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_training.zip',
  1467. 'domain': 'small molecules',
  1468. },
  1469. 'Tox21_p53_testing': {
  1470. 'database': 'tudataset',
  1471. 'reference': '[24]',
  1472. 'dataset_size': 269,
  1473. 'class_number': 2,
  1474. 'task_type': 'classification',
  1475. 'ave_node_num': 22.14,
  1476. 'ave_edge_num': 23.04,
  1477. 'node_labeled': True,
  1478. 'edge_labeled': True,
  1479. 'node_attr_dim': 0,
  1480. 'geometry': None,
  1481. 'edge_attr_dim': 0,
  1482. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_testing.zip',
  1483. 'domain': 'small molecules',
  1484. },
  1485. 'Tox21_p53_evaluation': {
  1486. 'database': 'tudataset',
  1487. 'reference': '[24]',
  1488. 'dataset_size': 613,
  1489. 'class_number': 2,
  1490. 'task_type': 'classification',
  1491. 'ave_node_num': 17.34,
  1492. 'ave_edge_num': 17.72,
  1493. 'node_labeled': True,
  1494. 'edge_labeled': True,
  1495. 'node_attr_dim': 0,
  1496. 'geometry': None,
  1497. 'edge_attr_dim': 0,
  1498. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_p53_evaluation.zip',
  1499. 'domain': 'small molecules',
  1500. },
  1501. 'Tox21_PPAR-gamma_training': {
  1502. 'database': 'tudataset',
  1503. 'reference': '[24]',
  1504. 'dataset_size': 8184,
  1505. 'class_number': 2,
  1506. 'task_type': 'classification',
  1507. 'ave_node_num': 17.23,
  1508. 'ave_edge_num': 17.55,
  1509. 'node_labeled': True,
  1510. 'edge_labeled': True,
  1511. 'node_attr_dim': 0,
  1512. 'geometry': None,
  1513. 'edge_attr_dim': 0,
  1514. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_training.zip',
  1515. 'domain': 'small molecules',
  1516. },
  1517. 'Tox21_PPAR-gamma_testing': {
  1518. 'database': 'tudataset',
  1519. 'reference': '[24]',
  1520. 'dataset_size': 267,
  1521. 'class_number': 2,
  1522. 'task_type': 'classification',
  1523. 'ave_node_num': 22.04,
  1524. 'ave_edge_num': 22.93,
  1525. 'node_labeled': True,
  1526. 'edge_labeled': True,
  1527. 'node_attr_dim': 0,
  1528. 'geometry': None,
  1529. 'edge_attr_dim': 0,
  1530. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_testing.zip',
  1531. 'domain': 'small molecules',
  1532. },
  1533. 'Tox21_PPAR-gamma_evaluation': {
  1534. 'database': 'tudataset',
  1535. 'reference': '[24]',
  1536. 'dataset_size': 602,
  1537. 'class_number': 2,
  1538. 'task_type': 'classification',
  1539. 'ave_node_num': 17.38,
  1540. 'ave_edge_num': 17.77,
  1541. 'node_labeled': True,
  1542. 'edge_labeled': True,
  1543. 'node_attr_dim': 0,
  1544. 'geometry': None,
  1545. 'edge_attr_dim': 0,
  1546. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Tox21_PPAR-gamma_evaluation.zip',
  1547. 'domain': 'small molecules',
  1548. },
  1549. 'UACC257': {
  1550. 'database': 'tudataset',
  1551. 'reference': '[28]',
  1552. 'dataset_size': 39988,
  1553. 'class_number': 2,
  1554. 'task_type': 'classification',
  1555. 'ave_node_num': 26.09,
  1556. 'ave_edge_num': 28.12,
  1557. 'node_labeled': True,
  1558. 'edge_labeled': True,
  1559. 'node_attr_dim': 0,
  1560. 'geometry': None,
  1561. 'edge_attr_dim': 0,
  1562. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257.zip',
  1563. 'domain': 'small molecules',
  1564. },
  1565. 'UACC257H': {
  1566. 'database': 'tudataset',
  1567. 'reference': '[28]',
  1568. 'dataset_size': 39988,
  1569. 'class_number': 2,
  1570. 'task_type': 'classification',
  1571. 'ave_node_num': 46.68,
  1572. 'ave_edge_num': 48.71,
  1573. 'node_labeled': True,
  1574. 'edge_labeled': True,
  1575. 'node_attr_dim': 0,
  1576. 'geometry': None,
  1577. 'edge_attr_dim': 0,
  1578. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/UACC257H.zip',
  1579. 'domain': 'small molecules',
  1580. },
  1581. 'uracil': {
  1582. 'database': 'tudataset',
  1583. 'reference': '[36]',
  1584. 'dataset_size': 133770,
  1585. 'class_number': None,
  1586. 'task_type': 'regression',
  1587. 'ave_node_num': 12.0,
  1588. 'ave_edge_num': 64.44,
  1589. 'node_labeled': True,
  1590. 'edge_labeled': False,
  1591. 'node_attr_dim': 6,
  1592. 'geometry': '3D, RI',
  1593. 'edge_attr_dim': 0,
  1594. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/uracil.zip',
  1595. 'domain': 'small molecules',
  1596. },
  1597. 'Yeast': {
  1598. 'database': 'tudataset',
  1599. 'reference': '[28]',
  1600. 'dataset_size': 79601,
  1601. 'class_number': 2,
  1602. 'task_type': 'classification',
  1603. 'ave_node_num': 21.54,
  1604. 'ave_edge_num': 22.84,
  1605. 'node_labeled': True,
  1606. 'edge_labeled': True,
  1607. 'node_attr_dim': 0,
  1608. 'geometry': None,
  1609. 'edge_attr_dim': 0,
  1610. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Yeast.zip',
  1611. 'domain': 'small molecules',
  1612. },
  1613. 'YeastH': {
  1614. 'database': 'tudataset',
  1615. 'reference': '[28]',
  1616. 'dataset_size': 79601,
  1617. 'class_number': 2,
  1618. 'task_type': 'classification',
  1619. 'ave_node_num': 39.44,
  1620. 'ave_edge_num': 40.74,
  1621. 'node_labeled': True,
  1622. 'edge_labeled': True,
  1623. 'node_attr_dim': 0,
  1624. 'geometry': None,
  1625. 'edge_attr_dim': 0,
  1626. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/YeastH.zip',
  1627. 'domain': 'small molecules',
  1628. },
  1629. 'ZINC_full': {
  1630. 'database': 'tudataset',
  1631. 'reference': '[31]',
  1632. 'dataset_size': 249456,
  1633. 'class_number': None,
  1634. 'task_type': 'regression',
  1635. 'ave_node_num': 23.14,
  1636. 'ave_edge_num': 24.91,
  1637. 'node_labeled': True,
  1638. 'edge_labeled': True,
  1639. 'node_attr_dim': 0,
  1640. 'geometry': None,
  1641. 'edge_attr_dim': 0,
  1642. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_full.zip',
  1643. 'domain': 'small molecules',
  1644. },
  1645. 'ZINC_test': {
  1646. 'database': 'tudataset',
  1647. 'reference': '[31]',
  1648. 'dataset_size': 5000,
  1649. 'class_number': None,
  1650. 'task_type': 'regression',
  1651. 'ave_node_num': 23.1,
  1652. 'ave_edge_num': 24.83,
  1653. 'node_labeled': True,
  1654. 'edge_labeled': True,
  1655. 'node_attr_dim': 0,
  1656. 'geometry': None,
  1657. 'edge_attr_dim': 0,
  1658. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_test.zip',
  1659. 'domain': 'small molecules',
  1660. },
  1661. 'ZINC_train': {
  1662. 'database': 'tudataset',
  1663. 'reference': '[31]',
  1664. 'dataset_size': 220011,
  1665. 'class_number': None,
  1666. 'task_type': 'regression',
  1667. 'ave_node_num': 23.15,
  1668. 'ave_edge_num': 24.91,
  1669. 'node_labeled': True,
  1670. 'edge_labeled': True,
  1671. 'node_attr_dim': 0,
  1672. 'geometry': None,
  1673. 'edge_attr_dim': 0,
  1674. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_train.zip',
  1675. 'domain': 'small molecules',
  1676. },
  1677. 'ZINC_val': {
  1678. 'database': 'tudataset',
  1679. 'reference': '[31]',
  1680. 'dataset_size': 24445,
  1681. 'class_number': None,
  1682. 'task_type': 'regression',
  1683. 'ave_node_num': 23.13,
  1684. 'ave_edge_num': 24.88,
  1685. 'node_labeled': True,
  1686. 'edge_labeled': True,
  1687. 'node_attr_dim': 0,
  1688. 'geometry': None,
  1689. 'edge_attr_dim': 0,
  1690. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/ZINC_val.zip',
  1691. 'domain': 'small molecules',
  1692. },
  1693. ### bioinformatics
  1694. 'DD': {
  1695. 'database': 'tudataset',
  1696. 'reference': '[6,22]',
  1697. 'dataset_size': 1178,
  1698. 'class_number': 2,
  1699. 'task_type': 'classification',
  1700. 'ave_node_num': 284.32,
  1701. 'ave_edge_num': 715.66,
  1702. 'node_labeled': True,
  1703. 'edge_labeled': False,
  1704. 'node_attr_dim': 0,
  1705. 'geometry': None,
  1706. 'edge_attr_dim': 0,
  1707. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DD.zip',
  1708. 'domain': 'bioinformatics',
  1709. },
  1710. 'ENZYMES': {
  1711. 'database': 'tudataset',
  1712. 'reference': '[4,5]',
  1713. 'dataset_size': 600,
  1714. 'class_number': 6,
  1715. 'task_type': 'classification',
  1716. 'ave_node_num': 32.63,
  1717. 'ave_edge_num': 62.14,
  1718. 'node_labeled': True,
  1719. 'edge_labeled': False,
  1720. 'node_attr_dim': 18,
  1721. 'geometry': None,
  1722. 'edge_attr_dim': 0,
  1723. 'url': 'http://www.chrsmrrs.com/graphkerneldatasets/ENZYMES.zip',
  1724. 'domain': 'bioinformatics',
  1725. },
  1726. 'KKI': {
  1727. 'database': 'tudataset',
  1728. 'reference': '[26]',
  1729. 'dataset_size': 83,
  1730. 'class_number': 2,
  1731. 'task_type': 'classification',
  1732. 'ave_node_num': 26.96,
  1733. 'ave_edge_num': 48.42,
  1734. 'node_labeled': True,
  1735. 'edge_labeled': False,
  1736. 'node_attr_dim': 0,
  1737. 'geometry': None,
  1738. 'edge_attr_dim': 0,
  1739. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/KKI.zip',
  1740. 'domain': 'bioinformatics',
  1741. },
  1742. 'OHSU': {
  1743. 'database': 'tudataset',
  1744. 'reference': '[26]',
  1745. 'dataset_size': 79,
  1746. 'class_number': 2,
  1747. 'task_type': 'classification',
  1748. 'ave_node_num': 82.01,
  1749. 'ave_edge_num': 199.66,
  1750. 'node_labeled': True,
  1751. 'edge_labeled': False,
  1752. 'node_attr_dim': 0,
  1753. 'geometry': None,
  1754. 'edge_attr_dim': 0,
  1755. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/OHSU.zip',
  1756. 'domain': 'bioinformatics',
  1757. },
  1758. 'Peking_1': {
  1759. 'database': 'tudataset',
  1760. 'reference': '[26]',
  1761. 'dataset_size': 85,
  1762. 'class_number': 2,
  1763. 'task_type': 'classification',
  1764. 'ave_node_num': 39.31,
  1765. 'ave_edge_num': 77.35,
  1766. 'node_labeled': True,
  1767. 'edge_labeled': False,
  1768. 'node_attr_dim': 0,
  1769. 'geometry': None,
  1770. 'edge_attr_dim': 0,
  1771. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Peking_1.zip',
  1772. 'domain': 'bioinformatics',
  1773. },
  1774. 'PROTEINS': {
  1775. 'database': 'tudataset',
  1776. 'reference': '[4,6]',
  1777. 'dataset_size': 1113,
  1778. 'class_number': 2,
  1779. 'task_type': 'classification',
  1780. 'ave_node_num': 39.06,
  1781. 'ave_edge_num': 72.82,
  1782. 'node_labeled': True,
  1783. 'edge_labeled': False,
  1784. 'node_attr_dim': 1,
  1785. 'geometry': None,
  1786. 'edge_attr_dim': 0,
  1787. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS.zip',
  1788. 'domain': 'bioinformatics',
  1789. },
  1790. 'PROTEINS_full': {
  1791. 'database': 'tudataset',
  1792. 'reference': '[4,6]',
  1793. 'dataset_size': 1113,
  1794. 'class_number': 2,
  1795. 'task_type': 'classification',
  1796. 'ave_node_num': 39.06,
  1797. 'ave_edge_num': 72.82,
  1798. 'node_labeled': True,
  1799. 'edge_labeled': False,
  1800. 'node_attr_dim': 29,
  1801. 'geometry': None,
  1802. 'edge_attr_dim': 0,
  1803. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/PROTEINS_full.zip',
  1804. 'domain': 'bioinformatics',
  1805. },
  1806. ### computer vision
  1807. 'COIL-DEL': {
  1808. 'database': 'tudataset',
  1809. 'reference': '[16,18]',
  1810. 'dataset_size': 3900,
  1811. 'class_number': 100,
  1812. 'task_type': 'classification',
  1813. 'ave_node_num': 21.54,
  1814. 'ave_edge_num': 54.24,
  1815. 'node_labeled': False,
  1816. 'edge_labeled': True,
  1817. 'node_attr_dim': 2,
  1818. 'geometry': None,
  1819. 'edge_attr_dim': 0,
  1820. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-DEL.zip',
  1821. 'domain': 'computer vision',
  1822. },
  1823. 'COIL-RAG': {
  1824. 'database': 'tudataset',
  1825. 'reference': '[16,18]',
  1826. 'dataset_size': 3900,
  1827. 'class_number': 100,
  1828. 'task_type': 'classification',
  1829. 'ave_node_num': 3.01,
  1830. 'ave_edge_num': 3.02,
  1831. 'node_labeled': False,
  1832. 'edge_labeled': False,
  1833. 'node_attr_dim': 64,
  1834. 'geometry': None,
  1835. 'edge_attr_dim': 1,
  1836. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COIL-RAG.zip',
  1837. 'domain': 'computer vision',
  1838. },
  1839. 'Cuneiform': {
  1840. 'database': 'tudataset',
  1841. 'reference': '[25]',
  1842. 'dataset_size': 267,
  1843. 'class_number': 30,
  1844. 'task_type': 'classification',
  1845. 'ave_node_num': 21.27,
  1846. 'ave_edge_num': 44.8,
  1847. 'node_labeled': True,
  1848. 'edge_labeled': True,
  1849. 'node_attr_dim': 3,
  1850. 'geometry': '3D',
  1851. 'edge_attr_dim': 2,
  1852. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Cuneiform.zip',
  1853. 'domain': 'computer vision',
  1854. },
  1855. 'Fingerprint': {
  1856. 'database': 'tudataset',
  1857. 'reference': '[16,19]',
  1858. 'dataset_size': 2800,
  1859. 'class_number': 4,
  1860. 'task_type': 'classification',
  1861. 'ave_node_num': 5.42,
  1862. 'ave_edge_num': 4.42,
  1863. 'node_labeled': False,
  1864. 'edge_labeled': False,
  1865. 'node_attr_dim': 2,
  1866. 'geometry': '2D',
  1867. 'edge_attr_dim': 2,
  1868. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Fingerprint.zip',
  1869. 'domain': 'computer vision',
  1870. },
  1871. 'FIRSTMM_DB': {
  1872. 'database': 'tudataset',
  1873. 'reference': '[11,12,13]',
  1874. 'dataset_size': 41,
  1875. 'class_number': 11,
  1876. 'task_type': 'classification',
  1877. 'ave_node_num': 1377.27,
  1878. 'ave_edge_num': 3074.1,
  1879. 'node_labeled': True,
  1880. 'edge_labeled': False,
  1881. 'node_attr_dim': 1,
  1882. 'geometry': None,
  1883. 'edge_attr_dim': 2,
  1884. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/FIRSTMM_DB.zip',
  1885. 'domain': 'computer vision',
  1886. },
  1887. 'Letter-high': {
  1888. 'database': 'tudataset',
  1889. 'reference': '[16]',
  1890. 'dataset_size': 2250,
  1891. 'class_number': 15,
  1892. 'task_type': 'classification',
  1893. 'ave_node_num': 4.67,
  1894. 'ave_edge_num': 4.5,
  1895. 'node_labeled': False,
  1896. 'edge_labeled': False,
  1897. 'node_attr_dim': 2,
  1898. 'geometry': '2D',
  1899. 'edge_attr_dim': 0,
  1900. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-high.zip',
  1901. 'domain': 'computer vision',
  1902. },
  1903. 'Letter-low': {
  1904. 'database': 'tudataset',
  1905. 'reference': '[16]',
  1906. 'dataset_size': 2250,
  1907. 'class_number': 15,
  1908. 'task_type': 'classification',
  1909. 'ave_node_num': 4.68,
  1910. 'ave_edge_num': 3.13,
  1911. 'node_labeled': False,
  1912. 'edge_labeled': False,
  1913. 'node_attr_dim': 2,
  1914. 'geometry': '2D',
  1915. 'edge_attr_dim': 0,
  1916. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-low.zip',
  1917. 'domain': 'computer vision',
  1918. },
  1919. 'Letter-med': {
  1920. 'database': 'tudataset',
  1921. 'reference': '[16]',
  1922. 'dataset_size': 2250,
  1923. 'class_number': 15,
  1924. 'task_type': 'classification',
  1925. 'ave_node_num': 4.67,
  1926. 'ave_edge_num': 4.5,
  1927. 'node_labeled': False,
  1928. 'edge_labeled': False,
  1929. 'node_attr_dim': 2,
  1930. 'geometry': '2D',
  1931. 'edge_attr_dim': 0,
  1932. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Letter-med.zip',
  1933. 'domain': 'computer vision',
  1934. },
  1935. 'MSRC_9': {
  1936. 'database': 'tudataset',
  1937. 'reference': '[13]',
  1938. 'dataset_size': 221,
  1939. 'class_number': 8,
  1940. 'task_type': 'classification',
  1941. 'ave_node_num': 40.58,
  1942. 'ave_edge_num': 97.94,
  1943. 'node_labeled': True,
  1944. 'edge_labeled': False,
  1945. 'node_attr_dim': 0,
  1946. 'geometry': None,
  1947. 'edge_attr_dim': 0,
  1948. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_9.zip',
  1949. 'domain': 'computer vision',
  1950. },
  1951. 'MSRC_21': {
  1952. 'database': 'tudataset',
  1953. 'reference': '[13]',
  1954. 'dataset_size': 563,
  1955. 'class_number': 20,
  1956. 'task_type': 'classification',
  1957. 'ave_node_num': 77.52,
  1958. 'ave_edge_num': 198.32,
  1959. 'node_labeled': True,
  1960. 'edge_labeled': False,
  1961. 'node_attr_dim': 0,
  1962. 'geometry': None,
  1963. 'edge_attr_dim': 0,
  1964. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21.zip',
  1965. 'domain': 'computer vision',
  1966. },
  1967. 'MSRC_21C': {
  1968. 'database': 'tudataset',
  1969. 'reference': '[13]',
  1970. 'dataset_size': 209,
  1971. 'class_number': 20,
  1972. 'task_type': 'classification',
  1973. 'ave_node_num': 40.28,
  1974. 'ave_edge_num': 96.6,
  1975. 'node_labeled': True,
  1976. 'edge_labeled': False,
  1977. 'node_attr_dim': 0,
  1978. 'geometry': None,
  1979. 'edge_attr_dim': 0,
  1980. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/MSRC_21C.zip',
  1981. 'domain': 'computer vision',
  1982. },
  1983. ### social networks
  1984. 'COLLAB': {
  1985. 'database': 'tudataset',
  1986. 'reference': '[14]',
  1987. 'dataset_size': 5000,
  1988. 'class_number': 3,
  1989. 'task_type': 'classification',
  1990. 'ave_node_num': 74.49,
  1991. 'ave_edge_num': 2457.78,
  1992. 'node_labeled': False,
  1993. 'edge_labeled': False,
  1994. 'node_attr_dim': 0,
  1995. 'geometry': None,
  1996. 'edge_attr_dim': 0,
  1997. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLLAB.zip',
  1998. 'domain': 'social networks',
  1999. },
  2000. 'dblp_ct1': {
  2001. 'database': 'tudataset',
  2002. 'reference': '[32]',
  2003. 'dataset_size': 755,
  2004. 'class_number': 2,
  2005. 'task_type': 'classification',
  2006. 'ave_node_num': 52.87,
  2007. 'ave_edge_num': 320.09,
  2008. 'node_labeled': False,
  2009. 'edge_labeled': False,
  2010. 'node_attr_dim': 0,
  2011. 'geometry': None,
  2012. 'edge_attr_dim': 'temporal',
  2013. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct1.zip',
  2014. 'domain': 'social networks',
  2015. },
  2016. 'dblp_ct2': {
  2017. 'database': 'tudataset',
  2018. 'reference': '[32]',
  2019. 'dataset_size': 755,
  2020. 'class_number': 2,
  2021. 'task_type': 'classification',
  2022. 'ave_node_num': 52.87,
  2023. 'ave_edge_num': 320.09,
  2024. 'node_labeled': False,
  2025. 'edge_labeled': False,
  2026. 'node_attr_dim': 0,
  2027. 'geometry': None,
  2028. 'edge_attr_dim': 'temporal',
  2029. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/dblp_ct2.zip',
  2030. 'domain': 'social networks',
  2031. },
  2032. 'DBLP_v1': {
  2033. 'database': 'tudataset',
  2034. 'reference': '[26]',
  2035. 'dataset_size': 19456,
  2036. 'class_number': 2,
  2037. 'task_type': 'classification',
  2038. 'ave_node_num': 10.48,
  2039. 'ave_edge_num': 19.65,
  2040. 'node_labeled': True,
  2041. 'edge_labeled': True,
  2042. 'node_attr_dim': 0,
  2043. 'geometry': None,
  2044. 'edge_attr_dim': 0,
  2045. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/DBLP_v1.zip',
  2046. 'domain': 'social networks',
  2047. },
  2048. 'deezer_ego_nets': {
  2049. 'database': 'tudataset',
  2050. 'reference': '[30]',
  2051. 'dataset_size': 9629,
  2052. 'class_number': 2,
  2053. 'task_type': 'classification',
  2054. 'ave_node_num': 23.49,
  2055. 'ave_edge_num': 65.25,
  2056. 'node_labeled': False,
  2057. 'edge_labeled': False,
  2058. 'node_attr_dim': 0,
  2059. 'geometry': None,
  2060. 'edge_attr_dim': 0,
  2061. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/deezer_ego_nets.zip',
  2062. 'domain': 'social networks',
  2063. },
  2064. 'facebook_ct1': {
  2065. 'database': 'tudataset',
  2066. 'reference': '[32]',
  2067. 'dataset_size': 995,
  2068. 'class_number': 2,
  2069. 'task_type': 'classification',
  2070. 'ave_node_num': 95.72,
  2071. 'ave_edge_num': 269.01,
  2072. 'node_labeled': False,
  2073. 'edge_labeled': False,
  2074. 'node_attr_dim': 0,
  2075. 'geometry': None,
  2076. 'edge_attr_dim': 'temporal',
  2077. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct1.zip',
  2078. 'domain': 'social networks',
  2079. },
  2080. 'facebook_ct2': {
  2081. 'database': 'tudataset',
  2082. 'reference': '[32]',
  2083. 'dataset_size': 995,
  2084. 'class_number': 2,
  2085. 'task_type': 'classification',
  2086. 'ave_node_num': 95.72,
  2087. 'ave_edge_num': 269.01,
  2088. 'node_labeled': False,
  2089. 'edge_labeled': False,
  2090. 'node_attr_dim': 0,
  2091. 'geometry': None,
  2092. 'edge_attr_dim': 'temporal',
  2093. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/facebook_ct2.zip',
  2094. 'domain': 'social networks',
  2095. },
  2096. 'github_stargazers': {
  2097. 'database': 'tudataset',
  2098. 'reference': '[30]',
  2099. 'dataset_size': 12725,
  2100. 'class_number': 2,
  2101. 'task_type': 'classification',
  2102. 'ave_node_num': 113.79,
  2103. 'ave_edge_num': 234.64,
  2104. 'node_labeled': False,
  2105. 'edge_labeled': False,
  2106. 'node_attr_dim': 0,
  2107. 'geometry': None,
  2108. 'edge_attr_dim': 0,
  2109. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/github_stargazers.zip',
  2110. 'domain': 'social networks',
  2111. },
  2112. 'highschool_ct1': {
  2113. 'database': 'tudataset',
  2114. 'reference': '[32]',
  2115. 'dataset_size': 180,
  2116. 'class_number': 2,
  2117. 'task_type': 'classification',
  2118. 'ave_node_num': 52.32,
  2119. 'ave_edge_num': 544.81,
  2120. 'node_labeled': False,
  2121. 'edge_labeled': False,
  2122. 'node_attr_dim': 0,
  2123. 'geometry': None,
  2124. 'edge_attr_dim': 'temporal',
  2125. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct1.zip',
  2126. 'domain': 'social networks',
  2127. },
  2128. 'highschool_ct2': {
  2129. 'database': 'tudataset',
  2130. 'reference': '[32]',
  2131. 'dataset_size': 180,
  2132. 'class_number': 2,
  2133. 'task_type': 'classification',
  2134. 'ave_node_num': 52.32,
  2135. 'ave_edge_num': 544.81,
  2136. 'node_labeled': False,
  2137. 'edge_labeled': False,
  2138. 'node_attr_dim': 0,
  2139. 'geometry': None,
  2140. 'edge_attr_dim': 'temporal',
  2141. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/highschool_ct2.zip',
  2142. 'domain': 'social networks',
  2143. },
  2144. 'IMDB-BINARY': {
  2145. 'database': 'tudataset',
  2146. 'reference': '[14]',
  2147. 'dataset_size': 1000,
  2148. 'class_number': 2,
  2149. 'task_type': 'classification',
  2150. 'ave_node_num': 19.77,
  2151. 'ave_edge_num': 96.53,
  2152. 'node_labeled': False,
  2153. 'edge_labeled': False,
  2154. 'node_attr_dim': 0,
  2155. 'geometry': '',
  2156. 'edge_attr_dim': 0,
  2157. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-BINARY.zip',
  2158. 'domain': 'social networks',
  2159. },
  2160. 'IMDB-MULTI': {
  2161. 'database': 'tudataset',
  2162. 'reference': '[14]',
  2163. 'dataset_size': 1500,
  2164. 'class_number': 3,
  2165. 'task_type': 'classification',
  2166. 'ave_node_num': 13.0,
  2167. 'ave_edge_num': 65.94,
  2168. 'node_labeled': False,
  2169. 'edge_labeled': False,
  2170. 'node_attr_dim': 0,
  2171. 'geometry': '',
  2172. 'edge_attr_dim': 0,
  2173. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/IMDB-MULTI.zip',
  2174. 'domain': 'social networks',
  2175. },
  2176. 'infectious_ct1': {
  2177. 'database': 'tudataset',
  2178. 'reference': '[32]',
  2179. 'dataset_size': 200,
  2180. 'class_number': 2,
  2181. 'task_type': 'classification',
  2182. 'ave_node_num': 50.0,
  2183. 'ave_edge_num': 459.72,
  2184. 'node_labeled': False,
  2185. 'edge_labeled': False,
  2186. 'node_attr_dim': 0,
  2187. 'geometry': None,
  2188. 'edge_attr_dim': 'temporal',
  2189. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct1.zip',
  2190. 'domain': 'social networks',
  2191. },
  2192. 'infectious_ct2': {
  2193. 'database': 'tudataset',
  2194. 'reference': '[32]',
  2195. 'dataset_size': 200,
  2196. 'class_number': 2,
  2197. 'task_type': 'classification',
  2198. 'ave_node_num': 50.0,
  2199. 'ave_edge_num': 459.72,
  2200. 'node_labeled': False,
  2201. 'edge_labeled': False,
  2202. 'node_attr_dim': 0,
  2203. 'geometry': None,
  2204. 'edge_attr_dim': 'temporal',
  2205. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/infectious_ct2.zip',
  2206. 'domain': 'social networks',
  2207. },
  2208. 'mit_ct1': {
  2209. 'database': 'tudataset',
  2210. 'reference': '[32]',
  2211. 'dataset_size': 97,
  2212. 'class_number': 2,
  2213. 'task_type': 'classification',
  2214. 'ave_node_num': 20.0,
  2215. 'ave_edge_num': 1469.15,
  2216. 'node_labeled': False,
  2217. 'edge_labeled': False,
  2218. 'node_attr_dim': 0,
  2219. 'geometry': None,
  2220. 'edge_attr_dim': 'temporal',
  2221. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct1.zip',
  2222. 'domain': 'social networks',
  2223. },
  2224. 'mit_ct2': {
  2225. 'database': 'tudataset',
  2226. 'reference': '[32]',
  2227. 'dataset_size': 97,
  2228. 'class_number': 2,
  2229. 'task_type': 'classification',
  2230. 'ave_node_num': 20.0,
  2231. 'ave_edge_num': 1469.15,
  2232. 'node_labeled': False,
  2233. 'edge_labeled': False,
  2234. 'node_attr_dim': 0,
  2235. 'geometry': None,
  2236. 'edge_attr_dim': 'temporal',
  2237. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/mit_ct2.zip',
  2238. 'domain': 'social networks',
  2239. },
  2240. 'REDDIT-BINARY': {
  2241. 'database': 'tudataset',
  2242. 'reference': '[14]',
  2243. 'dataset_size': 2000,
  2244. 'class_number': 2,
  2245. 'task_type': 'classification',
  2246. 'ave_node_num': 429.63,
  2247. 'ave_edge_num': 497.75,
  2248. 'node_labeled': False,
  2249. 'edge_labeled': False,
  2250. 'node_attr_dim': 0,
  2251. 'geometry': None,
  2252. 'edge_attr_dim': 0,
  2253. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-BINARY.zip',
  2254. 'domain': 'social networks',
  2255. },
  2256. 'REDDIT-MULTI-5K': {
  2257. 'database': 'tudataset',
  2258. 'reference': '[14]',
  2259. 'dataset_size': 4999,
  2260. 'class_number': 5,
  2261. 'task_type': 'classification',
  2262. 'ave_node_num': 508.52,
  2263. 'ave_edge_num': 594.87,
  2264. 'node_labeled': False,
  2265. 'edge_labeled': False,
  2266. 'node_attr_dim': 0,
  2267. 'geometry': None,
  2268. 'edge_attr_dim': 0,
  2269. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-5K.zip',
  2270. 'domain': 'social networks',
  2271. },
  2272. 'REDDIT-MULTI-12K': {
  2273. 'database': 'tudataset',
  2274. 'reference': '[14]',
  2275. 'dataset_size': 11929,
  2276. 'class_number': 11,
  2277. 'task_type': 'classification',
  2278. 'ave_node_num': 391.41,
  2279. 'ave_edge_num': 456.89,
  2280. 'node_labeled': False,
  2281. 'edge_labeled': False,
  2282. 'node_attr_dim': 0,
  2283. 'geometry': None,
  2284. 'edge_attr_dim': 0,
  2285. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/REDDIT-MULTI-12K.zip',
  2286. 'domain': 'social networks',
  2287. },
  2288. 'reddit_threads': {
  2289. 'database': 'tudataset',
  2290. 'reference': '[30]',
  2291. 'dataset_size': 203088,
  2292. 'class_number': 2,
  2293. 'task_type': 'classification',
  2294. 'ave_node_num': 23.93,
  2295. 'ave_edge_num': 24.99,
  2296. 'node_labeled': False,
  2297. 'edge_labeled': False,
  2298. 'node_attr_dim': 0,
  2299. 'geometry': None,
  2300. 'edge_attr_dim': 0,
  2301. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/reddit_threads.zip',
  2302. 'domain': 'social networks',
  2303. },
  2304. 'tumblr_ct1': {
  2305. 'database': 'tudataset',
  2306. 'reference': '[32]',
  2307. 'dataset_size': 373,
  2308. 'class_number': 2,
  2309. 'task_type': 'classification',
  2310. 'ave_node_num': 53.11,
  2311. 'ave_edge_num': 199.78,
  2312. 'node_labeled': False,
  2313. 'edge_labeled': False,
  2314. 'node_attr_dim': 0,
  2315. 'geometry': None,
  2316. 'edge_attr_dim': 'temporal',
  2317. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct1.zip',
  2318. 'domain': 'social networks',
  2319. },
  2320. 'tumblr_ct2': {
  2321. 'database': 'tudataset',
  2322. 'reference': '[32]',
  2323. 'dataset_size': 373,
  2324. 'class_number': 2,
  2325. 'task_type': 'classification',
  2326. 'ave_node_num': 53.11,
  2327. 'ave_edge_num': 199.78,
  2328. 'node_labeled': False,
  2329. 'edge_labeled': False,
  2330. 'node_attr_dim': 0,
  2331. 'geometry': None,
  2332. 'edge_attr_dim': 'temporal',
  2333. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/tumblr_ct2.zip',
  2334. 'domain': 'social networks',
  2335. },
  2336. 'twitch_egos': {
  2337. 'database': 'tudataset',
  2338. 'reference': '[30]',
  2339. 'dataset_size': 127094,
  2340. 'class_number': 2,
  2341. 'task_type': 'classification',
  2342. 'ave_node_num': 29.67,
  2343. 'ave_edge_num': 86.59,
  2344. 'node_labeled': False,
  2345. 'edge_labeled': False,
  2346. 'node_attr_dim': 0,
  2347. 'geometry': None,
  2348. 'edge_attr_dim': 0,
  2349. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/twitch_egos.zip',
  2350. 'domain': 'social networks',
  2351. },
  2352. 'TWITTER-Real-Graph-Partial': {
  2353. 'database': 'tudataset',
  2354. 'reference': '[26]',
  2355. 'dataset_size': 144033,
  2356. 'class_number': 2,
  2357. 'task_type': 'classification',
  2358. 'ave_node_num': 4.03,
  2359. 'ave_edge_num': 4.98,
  2360. 'node_labeled': True,
  2361. 'edge_labeled': False,
  2362. 'node_attr_dim': 0,
  2363. 'geometry': None,
  2364. 'edge_attr_dim': 1,
  2365. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TWITTER-Real-Graph-Partial.zip',
  2366. 'domain': 'social networks',
  2367. },
  2368. ### synthetic
  2369. 'COLORS-3': {
  2370. 'database': 'tudataset',
  2371. 'reference': '[27]',
  2372. 'dataset_size': 10500,
  2373. 'class_number': 11,
  2374. 'task_type': 'classification',
  2375. 'ave_node_num': 61.31,
  2376. 'ave_edge_num': 91.03,
  2377. 'node_labeled': False,
  2378. 'edge_labeled': False,
  2379. 'node_attr_dim': 4,
  2380. 'geometry': None,
  2381. 'edge_attr_dim': 0,
  2382. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/COLORS-3.zip',
  2383. 'domain': 'synthetic',
  2384. },
  2385. 'SYNTHETIC': {
  2386. 'database': 'tudataset',
  2387. 'reference': '[3]',
  2388. 'dataset_size': 300,
  2389. 'class_number': 2,
  2390. 'task_type': 'classification',
  2391. 'ave_node_num': 100.0,
  2392. 'ave_edge_num': 196.0,
  2393. 'node_labeled': False,
  2394. 'edge_labeled': False,
  2395. 'node_attr_dim': 1,
  2396. 'geometry': None,
  2397. 'edge_attr_dim': 0,
  2398. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETIC.zip',
  2399. 'domain': 'synthetic',
  2400. },
  2401. 'SYNTHETICnew': {
  2402. 'database': 'tudataset',
  2403. 'reference': '[3,10]',
  2404. 'dataset_size': 300,
  2405. 'class_number': 2,
  2406. 'task_type': 'classification',
  2407. 'ave_node_num': 100.0,
  2408. 'ave_edge_num': 196.25,
  2409. 'node_labeled': False,
  2410. 'edge_labeled': False,
  2411. 'node_attr_dim': 1,
  2412. 'geometry': None,
  2413. 'edge_attr_dim': 0,
  2414. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/SYNTHETICnew.zip',
  2415. 'domain': 'synthetic',
  2416. },
  2417. 'Synthie': {
  2418. 'database': 'tudataset',
  2419. 'reference': '[21]',
  2420. 'dataset_size': 400,
  2421. 'class_number': 4,
  2422. 'task_type': 'classification',
  2423. 'ave_node_num': 95.0,
  2424. 'ave_edge_num': 172.93,
  2425. 'node_labeled': False,
  2426. 'edge_labeled': False,
  2427. 'node_attr_dim': 15,
  2428. 'geometry': None,
  2429. 'edge_attr_dim': 0,
  2430. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/Synthie.zip',
  2431. 'domain': 'synthetic',
  2432. },
  2433. 'TRIANGLES': {
  2434. 'database': 'tudataset',
  2435. 'reference': '[27]',
  2436. 'dataset_size': 45000,
  2437. 'class_number': 10,
  2438. 'task_type': 'classification',
  2439. 'ave_node_num': 20.85,
  2440. 'ave_edge_num': 32.74,
  2441. 'node_labeled': False,
  2442. 'edge_labeled': False,
  2443. 'node_attr_dim': 0,
  2444. 'geometry': None,
  2445. 'edge_attr_dim': 0,
  2446. 'url': 'https://www.chrsmrrs.com/graphkerneldatasets/TRIANGLES.zip',
  2447. 'domain': 'synthetic',
  2448. },
  2449. }
# Single lookup table combining the GREYC, IAM and TUDataset metadata tables.
# The mappings are unpacked left to right, so if the same key appears in more
# than one of them the entry from the later table wins.
DATASET_META = {**GREYC_META, **IAM_META, **TUDataset_META}
  2451. def list_of_databases():
  2452. """List names of all databases.
  2453. Returns
  2454. -------
  2455. list
  2456. The list of all databases.
  2457. """
  2458. return [i for i in DATABASES]
  2459. def list_of_datasets():
  2460. """List names of all datasets.
  2461. Returns
  2462. -------
  2463. list
  2464. The list of all datasets.
  2465. """
  2466. return [i for i in DATASET_META]

A Python package for graph kernels, graph edit distances, and the graph pre-image problem.