You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

datasetDoc.json 4.2 kB

first commit Former-commit-id: 08bc23ba02cffbce3cf63962390a65459a132e48 [formerly 0795edd4834b9b7dc66db8d10d4cbaf42bbf82cb] [formerly b5010b42541add7e2ea2578bf2da537efc457757 [formerly a7ca09c2c34c4fc8b3d8e01fcfa08eeeb2cae99d]] [formerly 615058473a2177ca5b89e9edbb797f4c2a59c7e5 [formerly 743d8dfc6843c4c205051a8ab309fbb2116c895e] [formerly bb0ea98b1e14154ef464e2f7a16738705894e54b [formerly 960a69da74b81ef8093820e003f2d6c59a34974c]]] [formerly 2fa3be52c1b44665bc81a7cc7d4cea4bbf0d91d5 [formerly 2054589f0898627e0a17132fd9d4cc78efc91867] [formerly 3b53730e8a895e803dfdd6ca72bc05e17a4164c1 [formerly 8a2fa8ab7baf6686d21af1f322df46fd58c60e69]] [formerly 87d1e3a07a19d03c7d7c94d93ab4fa9f58dada7c [formerly f331916385a5afac1234854ee8d7f160f34b668f] [formerly 69fb3c78a483343f5071da4f7e2891b83a49dd18 [formerly 386086f05aa9487f65bce2ee54438acbdce57650]]]] Former-commit-id: a00aed8c934a6460c4d9ac902b9a74a3d6864697 [formerly 26fdeca29c2f07916d837883983ca2982056c78e] [formerly 0e3170d41a2f99ecf5c918183d361d4399d793bf [formerly 3c12ad4c88ac5192e0f5606ac0d88dd5bf8602dc]] [formerly d5894f84f2fd2e77a6913efdc5ae388cf1be0495 [formerly ad3e7bc670ff92c992730d29c9d3aa1598d844e8] [formerly 69fb3c78a483343f5071da4f7e2891b83a49dd18]] Former-commit-id: 3c19c9fae64f6106415fbc948a4dc613b9ee12f8 [formerly 467ddc0549c74bb007e8f01773bb6dc9103b417d] [formerly 5fa518345d958e2760e443b366883295de6d991c [formerly 3530e130b9fdb7280f638dbc2e785d2165ba82aa]] Former-commit-id: 9f5d473d42a435ec0d60149939d09be1acc25d92 [formerly be0b25c4ec2cde052a041baf0e11f774a158105d] Former-commit-id: 9eca71cb73ba9edccd70ac06a3b636b8d4093b04
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200
  1. {
  2. "about": {
  3. "datasetID": "database_dataset_1",
  4. "datasetName": "A dataset simulating a database dump",
  5. "description": "A synthetic dataset trying to be similar to a database dump, with tables with different relations between them.",
  6. "license": "CC",
  7. "datasetSchemaVersion": "4.0.0",
  8. "redacted": false,
  9. "datasetVersion": "4.0.0",
  10. "digest": "044b0c8724c80f672fb5a6e233b154d3342e4528de9a0245df77066f770c3d8f"
  11. },
  12. "dataResources": [
  13. {
  14. "resID": "codes",
  15. "resPath": "tables/codes.csv",
  16. "resType": "table",
  17. "resFormat": {
  18. "text/csv": [
  19. "csv"
  20. ]
  21. },
  22. "isCollection": false,
  23. "columnsCount": 3,
  24. "columns": [
  25. {
  26. "colIndex": 0,
  27. "colName": "code",
  28. "colType": "categorical",
  29. "role": [
  30. "index"
  31. ]
  32. },
  33. {
  34. "colIndex": 1,
  35. "colName": "name",
  36. "colType": "string",
  37. "role": [
  38. "attribute"
  39. ]
  40. },
  41. {
  42. "colIndex": 2,
  43. "colName": "author",
  44. "colType": "integer",
  45. "role": [
  46. "attribute"
  47. ],
  48. "refersTo": {
  49. "resID": "authors",
  50. "resObject": {
  51. "columnIndex": 0
  52. }
  53. }
  54. }
  55. ]
  56. },
  57. {
  58. "resID": "authors",
  59. "resPath": "tables/authors.csv",
  60. "resType": "table",
  61. "resFormat": {
  62. "text/csv": [
  63. "csv"
  64. ]
  65. },
  66. "isCollection": false,
  67. "columnsCount": 2,
  68. "columns": [
  69. {
  70. "colIndex": 0,
  71. "colName": "id",
  72. "colType": "integer",
  73. "role": [
  74. "index"
  75. ]
  76. },
  77. {
  78. "colIndex": 1,
  79. "colName": "name",
  80. "colType": "string",
  81. "role": [
  82. "attribute"
  83. ]
  84. }
  85. ]
  86. },
  87. {
  88. "resID": "values",
  89. "resPath": "tables/values.csv",
  90. "resType": "table",
  91. "resFormat": {
  92. "text/csv": [
  93. "csv"
  94. ]
  95. },
  96. "isCollection": false,
  97. "columnsCount": 4,
  98. "columns": [
  99. {
  100. "colIndex": 0,
  101. "colName": "code",
  102. "colType": "categorical",
  103. "role": [
  104. "attribute"
  105. ],
  106. "refersTo": {
  107. "resID": "codes",
  108. "resObject": {
  109. "columnName": "code"
  110. }
  111. }
  112. },
  113. {
  114. "colIndex": 1,
  115. "colName": "key",
  116. "colType": "categorical",
  117. "role": [
  118. "attribute"
  119. ]
  120. },
  121. {
  122. "colIndex": 2,
  123. "colName": "year",
  124. "colType": "dateTime",
  125. "role": [
  126. "attribute"
  127. ]
  128. },
  129. {
  130. "colIndex": 3,
  131. "colName": "value",
  132. "colType": "real",
  133. "role": [
  134. "attribute"
  135. ]
  136. }
  137. ]
  138. },
  139. {
  140. "resID": "learningData",
  141. "resPath": "tables/learningData.csv",
  142. "resType": "table",
  143. "resFormat": {
  144. "text/csv": [
  145. "csv"
  146. ]
  147. },
  148. "isCollection": false,
  149. "columnsCount": 5,
  150. "columns": [
  151. {
  152. "colIndex": 0,
  153. "colName": "d3mIndex",
  154. "colType": "integer",
  155. "role": [
  156. "index"
  157. ]
  158. },
  159. {
  160. "colIndex": 1,
  161. "colName": "code",
  162. "colType": "categorical",
  163. "role": [
  164. "attribute"
  165. ],
  166. "refersTo": {
  167. "resID": "codes",
  168. "resObject": {
  169. "columnName": "code"
  170. }
  171. }
  172. },
  173. {
  174. "colIndex": 2,
  175. "colName": "key",
  176. "colType": "categorical",
  177. "role": [
  178. "attribute"
  179. ]
  180. },
  181. {
  182. "colIndex": 3,
  183. "colName": "year",
  184. "colType": "dateTime",
  185. "role": [
  186. "attribute"
  187. ]
  188. },
  189. {
  190. "colIndex": 4,
  191. "colName": "value",
  192. "colType": "real",
  193. "role": [
  194. "suggestedTarget"
  195. ]
  196. }
  197. ]
  198. }
  199. ]
  200. }

全栈的自动化机器学习系统,主要针对多变量时间序列数据的异常检测。TODS提供了详尽的用于构建基于机器学习的异常检测系统的模块,它们包括:数据处理(data processing),时间序列处理( time series processing),特征分析(feature analysis),检测算法(detection algorithms),和强化模块( reinforcement module)。这些模块所提供的功能包括常见的数据预处理、时间序列数据的平滑或变换,从时域或频域中抽取特征、多种多样的检测算

Contributors (1)