You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

mnist_attack_nes.py 5.1 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162
  1. # Copyright 2019 Huawei Technologies Co., Ltd
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. import sys
  15. import numpy as np
  16. from mindspore import Tensor
  17. from mindspore import context
  18. from mindspore.train.serialization import load_checkpoint, load_param_into_net
  19. from lenet5_net import LeNet5
  20. from mindarmour.attacks.black.black_model import BlackModel
  21. from mindarmour.attacks.black.natural_evolutionary_strategy import NES
  22. from mindarmour.utils.logger import LogUtil
  23. sys.path.append("..")
  24. from data_processing import generate_mnist_dataset
  25. LOGGER = LogUtil.get_instance()
  26. LOGGER.set_level('INFO')
  27. TAG = 'HopSkipJumpAttack'
  28. class ModelToBeAttacked(BlackModel):
  29. """model to be attack"""
  30. def __init__(self, network):
  31. super(ModelToBeAttacked, self).__init__()
  32. self._network = network
  33. def predict(self, inputs):
  34. """predict"""
  35. if len(inputs.shape) == 3:
  36. inputs = inputs[np.newaxis, :]
  37. result = self._network(Tensor(inputs.astype(np.float32)))
  38. return result.asnumpy()
  39. def random_target_labels(true_labels, labels_list):
  40. target_labels = []
  41. for label in true_labels:
  42. while True:
  43. target_label = np.random.choice(labels_list)
  44. if target_label != label:
  45. target_labels.append(target_label)
  46. break
  47. return target_labels
  48. def _pseudorandom_target(index, total_indices, true_class):
  49. """ pseudo random_target """
  50. rng = np.random.RandomState(index)
  51. target = true_class
  52. while target == true_class:
  53. target = rng.randint(0, total_indices)
  54. return target
  55. def create_target_images(dataset, data_labels, target_labels):
  56. res = []
  57. for label in target_labels:
  58. for data_label, data in zip(data_labels, dataset):
  59. if data_label == label:
  60. res.append(data)
  61. break
  62. return np.array(res)
  63. def test_nes_mnist_attack():
  64. """
  65. hsja-Attack test
  66. """
  67. # upload trained network
  68. ckpt_name = './trained_ckpt_file/checkpoint_lenet-10_1875.ckpt'
  69. net = LeNet5()
  70. load_dict = load_checkpoint(ckpt_name)
  71. load_param_into_net(net, load_dict)
  72. net.set_train(False)
  73. # get test data
  74. data_list = "./MNIST_unzip/test"
  75. batch_size = 32
  76. ds = generate_mnist_dataset(data_list, batch_size=batch_size)
  77. # prediction accuracy before attack
  78. model = ModelToBeAttacked(net)
  79. # the number of batches of attacking samples
  80. batch_num = 5
  81. test_images = []
  82. test_labels = []
  83. predict_labels = []
  84. i = 0
  85. for data in ds.create_tuple_iterator():
  86. i += 1
  87. images = data[0].astype(np.float32)
  88. labels = data[1]
  89. test_images.append(images)
  90. test_labels.append(labels)
  91. pred_labels = np.argmax(model.predict(images), axis=1)
  92. predict_labels.append(pred_labels)
  93. if i >= batch_num:
  94. break
  95. predict_labels = np.concatenate(predict_labels)
  96. true_labels = np.concatenate(test_labels)
  97. accuracy = np.mean(np.equal(predict_labels, true_labels))
  98. LOGGER.info(TAG, "prediction accuracy before attacking is : %s",
  99. accuracy)
  100. test_images = np.concatenate(test_images)
  101. # attacking
  102. scene = 'Query_Limit'
  103. if scene == 'Query_Limit':
  104. top_k = -1
  105. elif scene == 'Partial_Info':
  106. top_k = 5
  107. elif scene == 'Label_Only':
  108. top_k = 5
  109. success = 0
  110. queries_num = 0
  111. nes_instance = NES(model, scene, top_k=top_k)
  112. test_length = 32
  113. advs = []
  114. for img_index in range(test_length):
  115. # Initial image and class selection
  116. initial_img = test_images[img_index]
  117. orig_class = true_labels[img_index]
  118. initial_img = [initial_img]
  119. target_class = random_target_labels([orig_class], true_labels)
  120. target_image = create_target_images(test_images, true_labels,
  121. target_class)
  122. nes_instance.set_target_images(target_image)
  123. tag, adv, queries = nes_instance.generate(initial_img, target_class)
  124. if tag[0]:
  125. success += 1
  126. queries_num += queries[0]
  127. advs.append(adv)
  128. advs = np.reshape(advs, (len(advs), 1, 32, 32))
  129. adv_pred = np.argmax(model.predict(advs), axis=1)
  130. adv_accuracy = np.mean(np.equal(adv_pred, true_labels[:test_length]))
  131. LOGGER.info(TAG, "prediction accuracy after attacking is : %s",
  132. adv_accuracy)
  133. if __name__ == '__main__':
  134. # device_target can be "CPU", "GPU" or "Ascend"
  135. context.set_context(mode=context.GRAPH_MODE, device_target="CPU")
  136. test_nes_mnist_attack()

MindArmour关注AI的安全和隐私问题。致力于增强模型的安全可信、保护用户的数据隐私。主要包含3个模块:对抗样本鲁棒性模块、Fuzz Testing模块、隐私保护与评估模块。 对抗样本鲁棒性模块 对抗样本鲁棒性模块用于评估模型对于对抗样本的鲁棒性,并提供模型增强方法用于增强模型抗对抗样本攻击的能力,提升模型鲁棒性。对抗样本鲁棒性模块包含了4个子模块:对抗样本的生成、对抗样本的检测、模型防御、攻防评估。