You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

buddy.cc 12 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "minddata/dataset/util/buddy.h"
  17. #include <iomanip>
  18. #include <stdexcept>
  19. #include "minddata/dataset/util/memory_pool.h"
  20. #include "minddata/dataset/util/system_pool.h"
  21. #include "utils/log_adapter.h"
  22. #include "./securec.h"
  23. inline uint64_t BitLeftShift(uint64_t v, uint64_t n) { return (v << n); }
  24. inline uint64_t BitRightShift(uint64_t v, uint64_t n) { return (v >> n); }
  25. inline uint64_t BitOr(uint64_t rhs, uint64_t lhs) { return rhs | lhs; }
  26. inline uint64_t BitEx(uint64_t rhs, uint64_t lhs) { return rhs ^ lhs; }
  27. inline uint64_t BitAnd(uint64_t rhs, uint64_t lhs) { return rhs & lhs; }
  28. namespace mindspore {
  29. namespace dataset {
  30. Status BuddySpace::Init() {
  31. if (log_min_ < 0) {
  32. return Status(StatusCode::kUnexpectedError, __LINE__, __FILE__,
  33. "log_min must be positive : " + std::to_string(log_min_));
  34. }
  35. if (num_lvl_ < 3 || num_lvl_ > 18) {
  36. return Status(StatusCode::kUnexpectedError, __LINE__, __FILE__,
  37. "num_lvl must be between 3 and 18 : " + std::to_string(num_lvl_));
  38. }
  39. min_ = BitLeftShift(1, log_min_);
  40. max_ = BitLeftShift(1, log_min_ + num_lvl_ - 1);
  41. size_t offset_1 = sizeof(rel_addr_t) * num_lvl_;
  42. size_t offset_2 = sizeof(int) * num_lvl_ + offset_1;
  43. size_t offset_3 = sizeof(char) * BitLeftShift(1, num_lvl_ - 3) + offset_2;
  44. try {
  45. mem_ = std::make_unique<uint8_t[]>(offset_3);
  46. } catch (const std::bad_alloc &e) {
  47. return Status(StatusCode::kOutOfMemory);
  48. }
  49. (void)memset_s(mem_.get(), offset_3, 0, offset_3);
  50. auto ptr = mem_.get();
  51. hint_ = reinterpret_cast<rel_addr_t *>(ptr);
  52. count_ = reinterpret_cast<int *>((reinterpret_cast<char *>(ptr) + offset_1));
  53. map_ = reinterpret_cast<char *>(ptr) + offset_2;
  54. count_[num_lvl_ - 1] = 1;
  55. map_[0] = BitOr(MORE_BIT, num_lvl_ - 3);
  56. return Status::OK();
  57. }
  58. Status BuddySpace::Alloc(const uint64_t sz, BSpaceDescriptor *desc, addr_t *p) noexcept {
  59. std::lock_guard<std::mutex> lock(mutex_);
  60. addr_t addr = AllocNoLock(sz, desc);
  61. if (addr != NOSPACE) {
  62. *p = addr;
  63. return Status::OK();
  64. } else {
  65. return Status(StatusCode::kBuddySpaceFull, "BuddySpace full. Not an error. Please ignore.");
  66. }
  67. }
  68. addr_t BuddySpace::AllocNoLock(const uint64_t sz, BSpaceDescriptor *desc) noexcept {
  69. MS_ASSERT(sz <= max_);
  70. uint32_t reqSize = SizeToBlock(sz);
  71. rel_addr_t rel_addr = AllocBuddySeg(reqSize);
  72. if (rel_addr != static_cast<rel_addr_t>(NOSPACE)) {
  73. (void)memset_s(desc, sizeof(BSpaceDescriptor), 0, sizeof(BSpaceDescriptor));
  74. desc->sig = static_cast<int>(0xDEADBEEF);
  75. desc->addr = rel_addr;
  76. desc->req_size = reqSize;
  77. desc->blk_size = NextPowerOf2(reqSize);
  78. return static_cast<addr_t>(rel_addr * min_);
  79. } else {
  80. return NOSPACE;
  81. }
  82. }
  83. void BuddySpace::FreeNoLock(const BSpaceDescriptor *desc) {
  84. MS_ASSERT(desc->sig == 0XDEADBEEF);
  85. rel_addr_t rel_addr = desc->addr;
  86. size_t blk_size = desc->blk_size;
  87. size_t req_size = desc->req_size;
  88. FreeBuddySeg(rel_addr, blk_size, req_size);
  89. }
  90. void BuddySpace::Free(const BSpaceDescriptor *desc) {
  91. std::lock_guard<std::mutex> lock(mutex_);
  92. return FreeNoLock(desc);
  93. }
  94. std::ostream &operator<<(std::ostream &os, const BuddySpace &s) {
  95. os << "1 unit = " << s.GetMinSize() << "\n"
  96. << "Size of buddy space = " << s.GetMaxSize() << "\n"
  97. << "Number of levels = " << s.num_lvl_ << "\n\n"
  98. << "Percent free = " << s.PercentFree() << "\n"
  99. << "Dumping count array : "
  100. << "\n";
  101. for (int i = 0; i < s.num_lvl_; i++) {
  102. os << "[" << i << "] = " << s.count_[i] << " ";
  103. if (((i + 1) % 4) == 0) {
  104. os << "\n";
  105. }
  106. }
  107. os << "\n";
  108. os << "Dumping allocation info:"
  109. << "\n";
  110. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, s.num_lvl_ - 1));
  111. rel_addr_t addr = 0;
  112. while (addr < max_addr) {
  113. size_t sz = 0;
  114. BuddySpace::STATE st;
  115. s.GetBuddySegState(addr, &sz, &st);
  116. os << "Address : " << std::left << std::setw(8) << addr << " Size : " << std::setw(8) << sz << " State : "
  117. << ((st == BuddySpace::STATE::kAlloc) ? "ALLOC" : ((st == BuddySpace::STATE::kFree) ? "FREE" : "Unkonwn"))
  118. << "\n";
  119. addr += sz;
  120. }
  121. return os;
  122. }
  123. void BuddySpace::GetBuddySegState(const rel_addr_t rel_addr, size_t *rel_sz, STATE *st) const {
  124. char byte;
  125. int pos;
  126. int offset;
  127. uint64_t val = 0;
  128. int shift;
  129. pos = BitRightShift(rel_addr, 2);
  130. offset = rel_addr % 4;
  131. shift = offset * 2;
  132. byte = map_[pos];
  133. switch (offset) {
  134. case 0:
  135. val = byte;
  136. break;
  137. case 1:
  138. case 3:
  139. if (offset == 1) {
  140. val = BitLeftShift(BitAnd(byte, 0x30), shift);
  141. } else {
  142. val = BitLeftShift(BitAnd(byte, 0x03), shift);
  143. }
  144. break;
  145. case 2:
  146. val = BitLeftShift(BitAnd(byte, 0x0F), shift);
  147. break;
  148. }
  149. if (BitAnd(val, ONE_BIT)) {
  150. *rel_sz = 1;
  151. } else if (BitAnd(val, TWO_BIT)) {
  152. *rel_sz = 2;
  153. } else if (BitAnd(val, MORE_BIT)) {
  154. log_t lg = BitAnd(val, 0x0F);
  155. *rel_sz = BitLeftShift(1, lg + 2);
  156. } else {
  157. *st = STATE::kEmpty;
  158. return;
  159. }
  160. *st = BitAnd(val, ALLOC_BIT) ? STATE::kAlloc : STATE::kFree;
  161. }
  162. void BuddySpace::SetBuddySegState(rel_addr_t rel_addr, size_t rel_sz, STATE st) {
  163. int clr;
  164. int mask;
  165. int pos;
  166. int offset;
  167. int val = 0;
  168. int shift;
  169. auto log_sz = static_cast<log_t>(Log2(rel_sz));
  170. pos = BitRightShift(rel_addr, 2);
  171. offset = rel_addr % 4;
  172. shift = offset * 2;
  173. if (rel_sz == 1) {
  174. val = ONE_BIT;
  175. mask = 0xC0;
  176. } else if (rel_sz == 2) {
  177. val = TWO_BIT;
  178. mask = 0xF0;
  179. } else {
  180. val = BitOr(log_sz - 2, MORE_BIT);
  181. mask = 0xFF;
  182. }
  183. if (st == STATE::kAlloc) {
  184. val = BitOr(val, ALLOC_BIT);
  185. } else if (st == STATE::kFree) {
  186. val = BitAnd(val, ~(static_cast<uint64_t>(ALLOC_BIT)));
  187. } else if (st == STATE::kEmpty) {
  188. val = 0;
  189. }
  190. clr = static_cast<int>(~(BitRightShift(mask, shift)));
  191. map_[pos] = static_cast<char>(BitAnd(map_[pos], clr));
  192. map_[pos] = static_cast<char>(BitOr(map_[pos], BitRightShift(val, shift)));
  193. if (st == STATE::kAlloc) {
  194. count_[log_sz]--;
  195. } else if (st == STATE::kFree) {
  196. count_[log_sz]++;
  197. if (rel_addr < hint_[log_sz]) {
  198. hint_[log_sz] = rel_addr;
  199. }
  200. }
  201. }
  202. void BuddySpace::JoinBuddySeg(rel_addr_t addr, size_t blk_sz) {
  203. while (blk_sz < BitLeftShift(1, num_lvl_)) {
  204. rel_addr_t buddy = BitEx(addr, blk_sz);
  205. size_t sz = 0;
  206. STATE st;
  207. GetBuddySegState(buddy, &sz, &st);
  208. if (st == STATE::kFree && sz == blk_sz) {
  209. auto log_sz = static_cast<log_t>(Log2(blk_sz));
  210. rel_addr_t left = (buddy < addr) ? buddy : addr;
  211. rel_addr_t right = left + blk_sz;
  212. MS_ASSERT(count_[log_sz] >= 2);
  213. count_[log_sz] -= 2;
  214. SetBuddySegState(right, blk_sz, STATE::kEmpty);
  215. SetBuddySegState(left, BitLeftShift(blk_sz, 1), STATE::kFree);
  216. for (int i = 0; i < log_sz; i++) {
  217. if (hint_[i] == right) {
  218. hint_[i] = left;
  219. }
  220. }
  221. addr = left;
  222. blk_sz <<= 1u;
  223. } else {
  224. break;
  225. }
  226. }
  227. }
  228. void BuddySpace::TrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  229. MS_ASSERT(ask_sz < blk_sz);
  230. uint32_t inx = Log2(blk_sz);
  231. size_t remaining_sz = ask_sz;
  232. for (int i = inx; i > 0; i--) {
  233. size_t b_size = BitLeftShift(1, i);
  234. size_t half_sz = BitRightShift(b_size, 1);
  235. count_[i]--;
  236. SetBuddySegState(addr, half_sz, STATE::kFree);
  237. SetBuddySegState(addr + half_sz, half_sz, STATE::kFree);
  238. if (remaining_sz >= half_sz) {
  239. SetBuddySegState(addr, half_sz, STATE::kAlloc);
  240. remaining_sz -= half_sz;
  241. if (remaining_sz == 0) {
  242. break;
  243. }
  244. addr += half_sz;
  245. }
  246. }
  247. }
  248. void BuddySpace::UnTrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  249. MS_ASSERT(ask_sz < blk_sz);
  250. uint32_t inx = Log2(blk_sz);
  251. size_t remaining_sz = ask_sz;
  252. for (int i = inx; i > 0; i--) {
  253. size_t b_size = BitLeftShift(1, i);
  254. size_t half_sz = BitRightShift(b_size, 1);
  255. if (remaining_sz >= half_sz) {
  256. #ifdef DEBUG
  257. {
  258. size_t sz = 0;
  259. STATE st;
  260. GetBuddySegState(addr, &sz, &st);
  261. MS_ASSERT(sz == half_sz && st == STATE::kAlloc);
  262. }
  263. #endif
  264. SetBuddySegState(addr, half_sz, STATE::kFree);
  265. remaining_sz -= half_sz;
  266. if (remaining_sz == 0) {
  267. JoinBuddySeg(addr, half_sz);
  268. break;
  269. }
  270. addr += half_sz;
  271. }
  272. }
  273. }
  274. rel_addr_t BuddySpace::AllocBuddySeg(uint32_t req_size) noexcept {
  275. uint32_t blk_size = NextPowerOf2(req_size);
  276. int start_inx = static_cast<int>(Log2(blk_size));
  277. bool found = false;
  278. rel_addr_t ask_addr = 0;
  279. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, num_lvl_ - 1));
  280. STATE st;
  281. size_t sz = 0;
  282. for (int i = start_inx; !found && i < num_lvl_; i++) {
  283. MS_ASSERT(count_[i] >= 0);
  284. if (count_[i] == 0) {
  285. continue;
  286. }
  287. auto blk_sz = static_cast<size_t>(BitLeftShift(1, i));
  288. ask_addr = hint_[i];
  289. while (ask_addr < max_addr && !found) {
  290. GetBuddySegState(ask_addr, &sz, &st);
  291. if (st == STATE::kFree && sz == blk_sz) {
  292. found = true;
  293. } else {
  294. MS_ASSERT(st != STATE::kEmpty);
  295. ask_addr += ((sz > blk_sz) ? sz : blk_sz);
  296. }
  297. }
  298. }
  299. if (found) {
  300. if (sz > req_size) {
  301. TrimBuddySeg(ask_addr, sz, req_size);
  302. } else {
  303. SetBuddySegState(ask_addr, sz, STATE::kAlloc);
  304. hint_[start_inx] = ask_addr;
  305. }
  306. return ask_addr;
  307. } else {
  308. return static_cast<rel_addr_t>(NOSPACE);
  309. }
  310. }
  311. void BuddySpace::FreeBuddySeg(rel_addr_t addr, size_t blk_size, size_t req_size) {
  312. if (req_size == blk_size) {
  313. #ifdef DEBUG
  314. {
  315. size_t sz = 0;
  316. STATE st;
  317. GetBuddySegState(addr, &sz, &st);
  318. }
  319. #endif
  320. SetBuddySegState(addr, blk_size, STATE::kFree);
  321. JoinBuddySeg(addr, blk_size);
  322. } else {
  323. UnTrimBuddySeg(addr, blk_size, req_size);
  324. }
  325. }
  326. int BuddySpace::PercentFree() const {
  327. uint64_t total_free_sz = 0;
  328. uint64_t max_sz_in_unit = BitLeftShift(1, num_lvl_ - 1);
  329. // Go through the count array without lock
  330. for (int i = 0; i < num_lvl_; i++) {
  331. int cnt = count_[i];
  332. if (cnt == 0) {
  333. continue;
  334. }
  335. uint64_t blk_sz = BitLeftShift(1, i);
  336. total_free_sz += (blk_sz * cnt);
  337. }
  338. return static_cast<int>(static_cast<float>(total_free_sz) / static_cast<float>(max_sz_in_unit) * 100);
  339. }
  340. BuddySpace::BuddySpace(int log_min, int num_lvl)
  341. : hint_(nullptr), count_(nullptr), map_(nullptr), log_min_(log_min), num_lvl_(num_lvl), min_(0), max_(0) {}
  342. BuddySpace::~BuddySpace() {
  343. hint_ = nullptr;
  344. count_ = nullptr;
  345. map_ = nullptr;
  346. }
  347. Status BuddySpace::CreateBuddySpace(std::unique_ptr<BuddySpace> *out_bs, int log_min, int num_lvl) {
  348. Status rc;
  349. auto bs = new (std::nothrow) BuddySpace(log_min, num_lvl);
  350. if (bs == nullptr) {
  351. return Status(StatusCode::kOutOfMemory);
  352. }
  353. rc = bs->Init();
  354. if (rc.IsOk()) {
  355. (*out_bs).reset(bs);
  356. } else {
  357. delete bs;
  358. }
  359. return rc;
  360. }
  361. } // namespace dataset
  362. } // namespace mindspore