You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; can include dashes ('-'); and can be up to 35 characters long.

build_test_detection_algorithm_PyodSoGaal.py 2.2 kB

intial commit Former-commit-id: 94043c2300f8ed1f7d676612700421a5183ff32e [formerly b45733a1d000ab3045d6f38d6118be345f835a45] [formerly d5042bb1361c9d75d644dfc3eedc004d3dcc4dca [formerly 51bb45768e19583c06d611610d26c7c2a04b181a]] [formerly 95ffadd6d860e1f3380c089f513b735fa3fddbf5 [formerly e90788f72939b4885271198c8260feca74c1b3af] [formerly 4baa1bbd360d23adfa8dba0aea20a9e67cbe7f6b [formerly e7c713266cc151eb60ab07751720dadf7bb52133]]] [formerly 772bf095ea019fb7d3f33964e678326ac5be620a [formerly d03cf02caa122a742ddd7b61f7ed4a1fa551d840] [formerly fea615997e5ed4c0561ad88767a0b6f8bd9b4666 [formerly fcae9cb8b6ad50e3f830449a118325f8b62f4d8d]] [formerly b8967be9621245419b7b5bee1b18f6974d340a85 [formerly 55dbea29edf58c39bad8cd8a9bf2358722dd9df1] [formerly 5f76bf379a704e6ca30a32d0394b679eaca433e4 [formerly 25720b71213364ebdf13d5b6b2700aaf8037a6a8]]]] [formerly 5d0c719dce4a0c713337d6cd052e16455b2bbaf0 [formerly f5dbbf1595ae57beb49de4ae616cff731be1cdd7] [formerly 836b4006c709579450d4107e1f8145ba0f09adc7 [formerly 7e18c6b3330e70c01a42fa130cfd8695051cac82]] [formerly 7e836793075e02ba49c444518c3376057ebb378c [formerly 3f42064f1e3821a1745b7fe8ae01046406ca383f] [formerly dcdf152eeab68e09fd006acf6bb5f420f7f75738 [formerly 28079a22ff9994e13d6c6fa60c4cce8a7375d7e5]]] [formerly 103942552aa9e77bd1cf6e52a2f9378cb23661f0 [formerly 4a083d8357e7de9e3ea41137549c41d2c3f07ec4] [formerly 3faae413507425f454e2d274ae987f535a07f9c6 [formerly a9cf74645861b8b08897084769508bcc1a1204a0]] [formerly f7a29ee08b2c0c57ba95f4879a534330eea4db2b [formerly 74f3ddb1cb29da8ee00163ccecc6bbc8c8502995] [formerly 8080c82fc1f574939594ac2ba4e52f7be01813ce [formerly 527e8c2ab36d902a68f17b0f98233938909f5a6d]]]]] [formerly 9c40821770d672749081d7941613e421f6d0b372 [formerly a0a0b218c0daaf35243b13d5568c5555b6256c15] [formerly 1a6449b3da9592753ed56d712ddb9a569927708f [formerly f28562eed42d64950c30b74684dcc23669855e21]] [formerly 6d2aa951248c19e39f2bd6a1b845798ce4288e03 [formerly fe33e93915c1afe5fecbc1bc4e057f10949ac4ed] 
[formerly 4fc4c5d6936f27e7446e0b84bfaab4b06236342c [formerly 595c3bc4683593003480a8101c594b1baa3c56d0]]] [formerly d041990a94b005b6f3e64877db9830945ccc7602 [formerly 8928771710d8e329946b2f0d489c69f95b132090] [formerly 6ce7b1b42aa9662cd15db1980afd83fdd04e7b00 [formerly 04df89fd7ee159470e419020fc12d315132173d7]] [formerly 6a0bfe64a94a23b7cfb056c0e7662b2185e6030c [formerly e3484903429a1cfb3953061d979299663dd2cf7f] [formerly 8ff59698a34a4b5753e6b5246a36cbf46b8e7a17 [formerly 45034f2ad26dc97dcc5294579223cdc731df0830]]]] [formerly c382eece4528c1f892e9c85888eda2a6841b98c5 [formerly 9a3e9804d38f60ef94af9752c84541af041692d5] [formerly c6dd56bdfb9bda63e21ca915010ca341490370d9 [formerly 4316d74e908debdb20b5f911126796295685fa0f]] [formerly cd5cc08abfa003938ceec8505315d3a337eca638 [formerly df4670ec947a0dfe0fa022481cd33f95fac4515e] [formerly a3920bd132c271a0df677c33a64a98c59205a913 [formerly 43850829262f4b5e27d60259caa188ab76102690]]] [formerly f2d68829faec7163a23dc0552faf522bdd17bf44 [formerly d617b51f8ed4896ff07ec99170bab747da67115c] [formerly 2c0363e76139fd557654da8ae160491010c3c254 [formerly d30774ccb9b7e3dbd97536a83f2d41c38971e216]] [formerly 1aefdb7a6d1ec0e5f8ad3682c8aaa7fa65200bc0 [formerly 0983b312de7d42cd159134d891f4d67646df376e] [formerly 16af77255b1e008f20dd4dba4ec9f119c2efc6bc [formerly 351d94a1a085d941f36fc7b0d972808b6aa5562e]]]]]] Former-commit-id: 0aac720ed915c5217616f5e245f26aa9343a4d98 [formerly 4c9b0637b00704e8b71835c46bc3e3e83e014630] [formerly e7ab703570838b27d396aa047782d8cccb537f03 [formerly 065727f4b8a5801d15afd2b91fcfce2b42e244f3]] [formerly a919abf3ebf5f473d10f3392ddba67d54657f294 [formerly 6fa494b0b32eb41c6990da0c791b8dee1925e459] [formerly d7e6376187c4b324a898f0a196888fe85d4832a1 [formerly ceee8b5ad677746fe4ff9b73aef020150ca4814b]]] [formerly 8135d4aaf571470296ee135c1dcd554d823096ff [formerly 0477e8c3775b95022a8236a17b68a899e3e36ad0] [formerly 78272aa1a38dcacfafcc64e00e7c43baadf2312a [formerly 43b5408fd257f569355f6db4aad80a13a01dd4d1]] [formerly 
8364ea76fab1d7cc00865851b8ddee5470ff6a00 [formerly 14305a7625964855833da7722453f746c41e9989] [formerly 3f6573a401ab18783ed4b87461eb2f8912333c7f [formerly c56850302d11ba87fe5a58d1651a1f80559cc3b8]]]] [formerly 4e2575e559fc0e853565324819ee22b207c611ba [formerly d8068f502691af1123a878a4099c33c3eab6201c] [formerly e51a3dd42fb3f4fd9fb15006b8201487f6a0f9d1 [formerly 81dd7e2f1d4b73a47d7e2e8ca501e98f4c59e5a1]] [formerly f604061af2b80906784d5d3a8dde03a6f7a2dfa2 [formerly e407b5d0b1d393a0dd4eec1fb54d718ff40cda39] [formerly 8d3602120d6406a4d3d139b17e1b2e73cf13b1f3 [formerly e563b7e7c551a2313e07d4d08e50f181c29172d7]]] [formerly aab553bb2f4be77f9123932ac6be519671f862ae [formerly 631d8d76c34a457e48e4055dd3616c945507162d] [formerly 1cec7b5f2f5d1b97ad657b8dc7a8ced100b34ff9 [formerly 945f34dbca68c3b9ee3c0e14fb19cd010f4670a3]] [formerly 080e18f0be8b6bf3adb7b953272e36998fa2562a [formerly f1132fa762a1232558c7ce18361687caf079305b] [formerly 16af77255b1e008f20dd4dba4ec9f119c2efc6bc]]]] Former-commit-id: ff7eb7ad1865310dc4622b5e989481d8e310ef08 [formerly e2e1163ef1ffae29d02ba78fd6b638103a07ea80] [formerly abc1fff948774fff8b34a8495551d49273f7e3d5 [formerly da6d629afa117ab8844235eadaf27286820c6398]] [formerly ff7dfe520b20803d969820dce67e0d59c1c81991 [formerly 015cc45265c6cb41598ae070e97cc7c64bc8148b] [formerly 8f9148b059ddcedfd3c43a53d881b95034ff01e4 [formerly 4d8370bc4514c6724cd6beb5855d1345c24d9a1c]]] [formerly be941c6dc41dd0a97692c4767657c3549051c11a [formerly dde58294984f723486c7a52e1e07a79bd6f0971e] [formerly 69d9c1a20a6b67623bf315359a8a49638a564e3c [formerly fcc8faa99322b698e34cb61e118e50fc68bc7a45]] [formerly 71bb6b09def26ec2dee4340a6d7af101846fc5c8 [formerly 7cb44f0d9d184d43e6dbf8081853ab88c479e577] [formerly 282bb412613c4ac759d8fa2f8a960935978c0511 [formerly 6d9106988971fce22763242d9c0017e16d1d4fc2]]]] Former-commit-id: e5a920084c8dc03117d73b27bb4776b9b9b4fe4d [formerly e8ac010da9dc53fb1de4d8287d48ae15dff2b8bc] [formerly dc836f921f454728d1987e9b8f90968d0d19f7c7 [formerly 
6fbd3b41e4ca7c94956536012a7e7d8617612f50]] [formerly 710c662c1423b614a47481a625114dc6e5bc47d9 [formerly 737958f86dad54fc51d487e8ad08bebc63096806] [formerly b38a85b15158c020114ef013400f74fc4b0e76d0 [formerly e9ce6a2129327c275c1dc6e06e2545a1c4929759]]] Former-commit-id: 46f2a522ddf879112539d13753985f079d416ad4 [formerly ba84173dab2fe91ad2766482689836708c49f7de] [formerly 7990bdcb4c348a53c612c5244331f14d3ace2ea0 [formerly b6dc6ec409b20d439d2963473d3d37b38cb55b16]] Former-commit-id: 90c1b4b06eb7da5638b2cb73219910b904d8596c [formerly aab646e394843e53c2ecaea90fe286a5f2b38841] Former-commit-id: 7532188e1b60dd2bd4853544e9a998d1d3ff74d4
5 years ago
1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950
  1. from d3m import index
  2. from d3m.metadata.base import ArgumentType
  3. from d3m.metadata.pipeline import Pipeline, PrimitiveStep
  4. from d3m.metadata import hyperparams
  5. import copy
  6. # -> dataset_to_dataframe -> column_parser -> extract_columns_by_semantic_types(attributes) -> imputer -> random_forest
  7. # extract_columns_by_semantic_types(targets) -> ^
  8. # Creating pipeline
  9. pipeline_description = Pipeline()
  10. pipeline_description.add_input(name='inputs')
  11. # Step 0: dataset_to_dataframe
  12. primitive_0 = index.get_primitive('d3m.primitives.tods.data_processing.dataset_to_dataframe')
  13. step_0 = PrimitiveStep(primitive=primitive_0)
  14. step_0.add_argument(name='inputs', argument_type=ArgumentType.CONTAINER, data_reference='inputs.0')
  15. step_0.add_output('produce')
  16. pipeline_description.add_step(step_0)
  17. # # Step 1: column_parser
  18. primitive_1 = index.get_primitive('d3m.primitives.tods.data_processing.column_parser')
  19. step_1 = PrimitiveStep(primitive=primitive_1)
  20. step_1.add_argument(name='inputs', argument_type=ArgumentType.CONTAINER, data_reference='steps.0.produce')
  21. step_1.add_output('produce')
  22. pipeline_description.add_step(step_1)
  23. # # Step 2: test primitive
  24. primitive_2 = index.get_primitive('d3m.primitives.tods.detection_algorithm.pyod_sogaal')
  25. step_2 = PrimitiveStep(primitive=primitive_2)
  26. step_2.add_hyperparameter(name='contamination', argument_type=ArgumentType.VALUE, data=0.1)
  27. step_2.add_hyperparameter(name='use_semantic_types', argument_type=ArgumentType.VALUE, data=True)
  28. step_2.add_hyperparameter(name='use_columns', argument_type=ArgumentType.VALUE, data=(2,)) # There is sth wrong with multi-dimensional
  29. step_2.add_hyperparameter(name='return_result', argument_type=ArgumentType.VALUE, data='append')
  30. step_2.add_argument(name='inputs', argument_type=ArgumentType.CONTAINER, data_reference='steps.1.produce')
  31. step_2.add_output('produce')
  32. pipeline_description.add_step(step_2)
  33. # Final Output
  34. pipeline_description.add_output(name='output predictions', data_reference='steps.2.produce')
  35. # Output to YAML
  36. yaml = pipeline_description.to_yaml()
  37. with open('pipeline.yml', 'w') as f:
  38. f.write(yaml)
  39. print(yaml)
  40. # Or you can output json
  41. #data = pipline_description.to_json()

全栈的自动化机器学习系统,主要针对多变量时间序列数据的异常检测。TODS提供了详尽的用于构建基于机器学习的异常检测系统的模块,它们包括:数据处理(data processing),时间序列处理(time series processing),特征分析(feature analysis),检测算法(detection algorithms),和强化模块(reinforcement module)。这些模块所提供的功能包括常见的数据预处理、时间序列数据的平滑或变换、从时域或频域中抽取特征、多种多样的检测算