You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

buddy.cc 12 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "minddata/dataset/util/buddy.h"
  17. #include <iomanip>
  18. #include <stdexcept>
  19. #include "minddata/dataset/util/memory_pool.h"
  20. #include "minddata/dataset/util/log_adapter.h"
  21. inline uint64_t BitLeftShift(uint64_t v, uint64_t n) { return (v << n); }
  22. inline uint64_t BitRightShift(uint64_t v, uint64_t n) { return (v >> n); }
  23. inline uint64_t BitOr(uint64_t rhs, uint64_t lhs) { return rhs | lhs; }
  24. inline uint64_t BitEx(uint64_t rhs, uint64_t lhs) { return rhs ^ lhs; }
  25. inline uint64_t BitAnd(uint64_t rhs, uint64_t lhs) { return rhs & lhs; }
  26. namespace mindspore {
  27. namespace dataset {
  28. Status BuddySpace::Init() {
  29. if (log_min_ < 0) {
  30. return Status(StatusCode::kMDUnexpectedError, __LINE__, __FILE__,
  31. "log_min must be positive : " + std::to_string(log_min_));
  32. }
  33. if (num_lvl_ < 3 || num_lvl_ > 18) {
  34. return Status(StatusCode::kMDUnexpectedError, __LINE__, __FILE__,
  35. "num_lvl must be between 3 and 18 : " + std::to_string(num_lvl_));
  36. }
  37. min_ = BitLeftShift(1, log_min_);
  38. max_ = BitLeftShift(1, log_min_ + num_lvl_ - 1);
  39. size_t offset_1 = sizeof(rel_addr_t) * num_lvl_;
  40. size_t offset_2 = sizeof(int) * num_lvl_ + offset_1;
  41. size_t offset_3 = sizeof(char) * BitLeftShift(1, num_lvl_ - 3) + offset_2;
  42. try {
  43. mem_ = std::make_unique<uint8_t[]>(offset_3);
  44. } catch (const std::bad_alloc &e) {
  45. return Status(StatusCode::kMDOutOfMemory);
  46. }
  47. (void)memset_s(mem_.get(), offset_3, 0, offset_3);
  48. auto ptr = mem_.get();
  49. hint_ = reinterpret_cast<rel_addr_t *>(ptr);
  50. count_ = reinterpret_cast<int *>((reinterpret_cast<char *>(ptr) + offset_1));
  51. map_ = reinterpret_cast<char *>(ptr) + offset_2;
  52. count_[num_lvl_ - 1] = 1;
  53. map_[0] = BitOr(MORE_BIT, num_lvl_ - 3);
  54. return Status::OK();
  55. }
  56. Status BuddySpace::Alloc(const uint64_t sz, BSpaceDescriptor *desc, addr_t *p) noexcept {
  57. std::lock_guard<std::mutex> lock(mutex_);
  58. addr_t addr = AllocNoLock(sz, desc);
  59. if (addr != NOSPACE) {
  60. *p = addr;
  61. return Status::OK();
  62. } else {
  63. return Status(StatusCode::kMDBuddySpaceFull, "BuddySpace full. Not an error. Please ignore.");
  64. }
  65. }
  66. addr_t BuddySpace::AllocNoLock(const uint64_t sz, BSpaceDescriptor *desc) noexcept {
  67. MS_ASSERT(sz <= max_);
  68. uint32_t reqSize = SizeToBlock(sz);
  69. rel_addr_t rel_addr = AllocBuddySeg(reqSize);
  70. if (rel_addr != static_cast<rel_addr_t>(NOSPACE)) {
  71. (void)memset_s(desc, sizeof(BSpaceDescriptor), 0, sizeof(BSpaceDescriptor));
  72. desc->sig = static_cast<int>(0xDEADBEEF);
  73. desc->addr = rel_addr;
  74. desc->req_size = reqSize;
  75. desc->blk_size = NextPowerOf2(reqSize);
  76. return static_cast<addr_t>(rel_addr * min_);
  77. } else {
  78. return NOSPACE;
  79. }
  80. }
  81. void BuddySpace::FreeNoLock(const BSpaceDescriptor *desc) {
  82. MS_ASSERT(desc->sig == 0XDEADBEEF);
  83. rel_addr_t rel_addr = desc->addr;
  84. size_t blk_size = desc->blk_size;
  85. size_t req_size = desc->req_size;
  86. FreeBuddySeg(rel_addr, blk_size, req_size);
  87. }
  88. void BuddySpace::Free(const BSpaceDescriptor *desc) {
  89. std::lock_guard<std::mutex> lock(mutex_);
  90. return FreeNoLock(desc);
  91. }
  92. std::ostream &operator<<(std::ostream &os, const BuddySpace &s) {
  93. os << "1 unit = " << s.GetMinSize() << "\n"
  94. << "Size of buddy space = " << s.GetMaxSize() << "\n"
  95. << "Number of levels = " << s.num_lvl_ << "\n\n"
  96. << "Percent free = " << s.PercentFree() << "\n"
  97. << "Dumping count array : "
  98. << "\n";
  99. for (int i = 0; i < s.num_lvl_; i++) {
  100. os << "[" << i << "] = " << s.count_[i] << " ";
  101. if (((i + 1) % 4) == 0) {
  102. os << "\n";
  103. }
  104. }
  105. os << "\n";
  106. os << "Dumping allocation info:"
  107. << "\n";
  108. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, s.num_lvl_ - 1));
  109. rel_addr_t addr = 0;
  110. while (addr < max_addr) {
  111. size_t sz = 0;
  112. BuddySpace::STATE st;
  113. s.GetBuddySegState(addr, &sz, &st);
  114. os << "Address : " << std::left << std::setw(8) << addr << " Size : " << std::setw(8) << sz << " State : "
  115. << ((st == BuddySpace::STATE::kAlloc) ? "ALLOC" : ((st == BuddySpace::STATE::kFree) ? "FREE" : "Unknown"))
  116. << "\n";
  117. addr += sz;
  118. }
  119. return os;
  120. }
  121. void BuddySpace::GetBuddySegState(const rel_addr_t rel_addr, size_t *rel_sz, STATE *st) const {
  122. char byte;
  123. int pos;
  124. int offset;
  125. uint64_t val = 0;
  126. int shift;
  127. pos = BitRightShift(rel_addr, 2);
  128. offset = rel_addr % 4;
  129. shift = offset * 2;
  130. byte = map_[pos];
  131. switch (offset) {
  132. case 0:
  133. val = byte;
  134. break;
  135. case 1:
  136. case 3:
  137. if (offset == 1) {
  138. val = BitLeftShift(BitAnd(byte, 0x30), shift);
  139. } else {
  140. val = BitLeftShift(BitAnd(byte, 0x03), shift);
  141. }
  142. break;
  143. case 2:
  144. val = BitLeftShift(BitAnd(byte, 0x0F), shift);
  145. break;
  146. }
  147. if (BitAnd(val, ONE_BIT)) {
  148. *rel_sz = 1;
  149. } else if (BitAnd(val, TWO_BIT)) {
  150. *rel_sz = 2;
  151. } else if (BitAnd(val, MORE_BIT)) {
  152. log_t lg = BitAnd(val, 0x0F);
  153. *rel_sz = BitLeftShift(1, lg + 2);
  154. } else {
  155. *st = STATE::kEmpty;
  156. return;
  157. }
  158. *st = BitAnd(val, ALLOC_BIT) ? STATE::kAlloc : STATE::kFree;
  159. }
  160. void BuddySpace::SetBuddySegState(rel_addr_t rel_addr, size_t rel_sz, STATE st) {
  161. int clr;
  162. int mask;
  163. int pos;
  164. int offset;
  165. int val = 0;
  166. int shift;
  167. auto log_sz = static_cast<log_t>(Log2(rel_sz));
  168. pos = BitRightShift(rel_addr, 2);
  169. offset = rel_addr % 4;
  170. shift = offset * 2;
  171. if (rel_sz == 1) {
  172. val = ONE_BIT;
  173. mask = 0xC0;
  174. } else if (rel_sz == 2) {
  175. val = TWO_BIT;
  176. mask = 0xF0;
  177. } else {
  178. val = BitOr(log_sz - 2, MORE_BIT);
  179. mask = 0xFF;
  180. }
  181. if (st == STATE::kAlloc) {
  182. val = BitOr(val, ALLOC_BIT);
  183. } else if (st == STATE::kFree) {
  184. val = BitAnd(val, ~(static_cast<uint64_t>(ALLOC_BIT)));
  185. } else if (st == STATE::kEmpty) {
  186. val = 0;
  187. }
  188. clr = static_cast<int>(~(BitRightShift(mask, shift)));
  189. map_[pos] = static_cast<char>(BitAnd(map_[pos], clr));
  190. map_[pos] = static_cast<char>(BitOr(map_[pos], BitRightShift(val, shift)));
  191. if (st == STATE::kAlloc) {
  192. count_[log_sz]--;
  193. } else if (st == STATE::kFree) {
  194. count_[log_sz]++;
  195. if (rel_addr < hint_[log_sz]) {
  196. hint_[log_sz] = rel_addr;
  197. }
  198. }
  199. }
  200. void BuddySpace::JoinBuddySeg(rel_addr_t addr, size_t blk_sz) {
  201. while (blk_sz < BitLeftShift(1, num_lvl_)) {
  202. rel_addr_t buddy = BitEx(addr, blk_sz);
  203. size_t sz = 0;
  204. STATE st;
  205. GetBuddySegState(buddy, &sz, &st);
  206. if (st == STATE::kFree && sz == blk_sz) {
  207. auto log_sz = static_cast<log_t>(Log2(blk_sz));
  208. rel_addr_t left = (buddy < addr) ? buddy : addr;
  209. rel_addr_t right = left + blk_sz;
  210. MS_ASSERT(count_[log_sz] >= 2);
  211. count_[log_sz] -= 2;
  212. SetBuddySegState(right, blk_sz, STATE::kEmpty);
  213. SetBuddySegState(left, BitLeftShift(blk_sz, 1), STATE::kFree);
  214. for (int i = 0; i < log_sz; i++) {
  215. if (hint_[i] == right) {
  216. hint_[i] = left;
  217. }
  218. }
  219. addr = left;
  220. blk_sz <<= 1u;
  221. } else {
  222. break;
  223. }
  224. }
  225. }
  226. void BuddySpace::TrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  227. MS_ASSERT(ask_sz < blk_sz);
  228. uint32_t inx = Log2(blk_sz);
  229. size_t remaining_sz = ask_sz;
  230. for (int i = inx; i > 0; i--) {
  231. size_t b_size = BitLeftShift(1, i);
  232. size_t half_sz = BitRightShift(b_size, 1);
  233. count_[i]--;
  234. SetBuddySegState(addr, half_sz, STATE::kFree);
  235. SetBuddySegState(addr + half_sz, half_sz, STATE::kFree);
  236. if (remaining_sz >= half_sz) {
  237. SetBuddySegState(addr, half_sz, STATE::kAlloc);
  238. remaining_sz -= half_sz;
  239. if (remaining_sz == 0) {
  240. break;
  241. }
  242. addr += half_sz;
  243. }
  244. }
  245. }
  246. void BuddySpace::UnTrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  247. MS_ASSERT(ask_sz < blk_sz);
  248. uint32_t inx = Log2(blk_sz);
  249. size_t remaining_sz = ask_sz;
  250. for (int i = inx; i > 0; i--) {
  251. size_t b_size = BitLeftShift(1, i);
  252. size_t half_sz = BitRightShift(b_size, 1);
  253. if (remaining_sz >= half_sz) {
  254. #ifdef DEBUG
  255. {
  256. size_t sz = 0;
  257. STATE st;
  258. GetBuddySegState(addr, &sz, &st);
  259. MS_ASSERT(sz == half_sz && st == STATE::kAlloc);
  260. }
  261. #endif
  262. SetBuddySegState(addr, half_sz, STATE::kFree);
  263. remaining_sz -= half_sz;
  264. if (remaining_sz == 0) {
  265. JoinBuddySeg(addr, half_sz);
  266. break;
  267. }
  268. addr += half_sz;
  269. }
  270. }
  271. }
  272. rel_addr_t BuddySpace::AllocBuddySeg(uint32_t req_size) noexcept {
  273. uint32_t blk_size = NextPowerOf2(req_size);
  274. int start_inx = static_cast<int>(Log2(blk_size));
  275. bool found = false;
  276. rel_addr_t ask_addr = 0;
  277. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, num_lvl_ - 1));
  278. STATE st;
  279. size_t sz = 0;
  280. for (int i = start_inx; !found && i < num_lvl_; i++) {
  281. MS_ASSERT(count_[i] >= 0);
  282. if (count_[i] == 0) {
  283. continue;
  284. }
  285. auto blk_sz = static_cast<size_t>(BitLeftShift(1, i));
  286. ask_addr = hint_[i];
  287. while (ask_addr < max_addr && !found) {
  288. GetBuddySegState(ask_addr, &sz, &st);
  289. if (st == STATE::kFree && sz == blk_sz) {
  290. found = true;
  291. } else {
  292. MS_ASSERT(st != STATE::kEmpty);
  293. ask_addr += ((sz > blk_sz) ? sz : blk_sz);
  294. }
  295. }
  296. }
  297. if (found) {
  298. if (sz > req_size) {
  299. TrimBuddySeg(ask_addr, sz, req_size);
  300. } else {
  301. SetBuddySegState(ask_addr, sz, STATE::kAlloc);
  302. hint_[start_inx] = ask_addr;
  303. }
  304. return ask_addr;
  305. } else {
  306. return static_cast<rel_addr_t>(NOSPACE);
  307. }
  308. }
  309. void BuddySpace::FreeBuddySeg(rel_addr_t addr, size_t blk_size, size_t req_size) {
  310. if (req_size == blk_size) {
  311. #ifdef DEBUG
  312. {
  313. size_t sz = 0;
  314. STATE st;
  315. GetBuddySegState(addr, &sz, &st);
  316. }
  317. #endif
  318. SetBuddySegState(addr, blk_size, STATE::kFree);
  319. JoinBuddySeg(addr, blk_size);
  320. } else {
  321. UnTrimBuddySeg(addr, blk_size, req_size);
  322. }
  323. }
  324. int BuddySpace::PercentFree() const {
  325. uint64_t total_free_sz = 0;
  326. uint64_t max_sz_in_unit = BitLeftShift(1, num_lvl_ - 1);
  327. // Go through the count array without lock
  328. for (int i = 0; i < num_lvl_; i++) {
  329. int cnt = count_[i];
  330. if (cnt == 0) {
  331. continue;
  332. }
  333. uint64_t blk_sz = BitLeftShift(1, i);
  334. total_free_sz += (blk_sz * cnt);
  335. }
  336. return static_cast<int>(static_cast<float>(total_free_sz) / static_cast<float>(max_sz_in_unit) * 100);
  337. }
  338. BuddySpace::BuddySpace(int log_min, int num_lvl)
  339. : hint_(nullptr), count_(nullptr), map_(nullptr), log_min_(log_min), num_lvl_(num_lvl), min_(0), max_(0) {}
  340. BuddySpace::~BuddySpace() {
  341. hint_ = nullptr;
  342. count_ = nullptr;
  343. map_ = nullptr;
  344. }
  345. Status BuddySpace::CreateBuddySpace(std::unique_ptr<BuddySpace> *out_bs, int log_min, int num_lvl) {
  346. Status rc;
  347. auto bs = new (std::nothrow) BuddySpace(log_min, num_lvl);
  348. if (bs == nullptr) {
  349. return Status(StatusCode::kMDOutOfMemory);
  350. }
  351. rc = bs->Init();
  352. if (rc.IsOk()) {
  353. (*out_bs).reset(bs);
  354. } else {
  355. delete bs;
  356. }
  357. return rc;
  358. }
  359. } // namespace dataset
  360. } // namespace mindspore