You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

buddy.cc 11 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388
  1. /**
  2. * Copyright 2019 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "minddata/dataset/util/buddy.h"
  17. #include <iomanip>
  18. #include <stdexcept>
  19. #include "minddata/dataset/util/memory_pool.h"
  20. #include "minddata/dataset/util/system_pool.h"
  21. #include "utils/log_adapter.h"
  22. #include "./securec.h"
  23. inline uint64_t BitLeftShift(uint64_t v, uint64_t n) { return (v << n); }
  24. inline uint64_t BitRightShift(uint64_t v, uint64_t n) { return (v >> n); }
  25. inline uint64_t BitOr(uint64_t rhs, uint64_t lhs) { return rhs | lhs; }
  26. inline uint64_t BitEx(uint64_t rhs, uint64_t lhs) { return rhs ^ lhs; }
  27. inline uint64_t BitAnd(uint64_t rhs, uint64_t lhs) { return rhs & lhs; }
  28. namespace mindspore {
  29. namespace dataset {
  30. Status BuddySpace::Init() {
  31. if (log_min_ < 0) {
  32. return Status(StatusCode::kUnexpectedError, __LINE__, __FILE__,
  33. "log_min must be positive : " + std::to_string(log_min_));
  34. }
  35. if (num_lvl_ < 3 || num_lvl_ > 18) {
  36. return Status(StatusCode::kUnexpectedError, __LINE__, __FILE__,
  37. "num_lvl must be between 3 and 18 : " + std::to_string(num_lvl_));
  38. }
  39. min_ = BitLeftShift(1, log_min_);
  40. max_ = BitLeftShift(1, log_min_ + num_lvl_ - 1);
  41. size_t offset_1 = sizeof(rel_addr_t) * num_lvl_;
  42. size_t offset_2 = sizeof(int) * num_lvl_ + offset_1;
  43. size_t offset_3 = sizeof(char) * BitLeftShift(1, num_lvl_ - 3) + offset_2;
  44. RETURN_IF_NOT_OK(DeMalloc(offset_3, &ptr_, true));
  45. hint_ = reinterpret_cast<rel_addr_t *>(ptr_);
  46. count_ = reinterpret_cast<int *>((reinterpret_cast<char *>(ptr_) + offset_1));
  47. map_ = reinterpret_cast<char *>(ptr_) + offset_2;
  48. count_[num_lvl_ - 1] = 1;
  49. map_[0] = BitOr(MORE_BIT, num_lvl_ - 3);
  50. return Status::OK();
  51. }
  52. Status BuddySpace::Alloc(const uint64_t sz, BSpaceDescriptor *desc, addr_t *p) noexcept {
  53. std::lock_guard<std::mutex> lock(mutex_);
  54. addr_t addr = AllocNoLock(sz, desc);
  55. if (addr != NOSPACE) {
  56. *p = addr;
  57. return Status::OK();
  58. } else {
  59. return Status(StatusCode::kNoSpace, "BuddySpace full. Not an error. Please ignore.");
  60. }
  61. }
  62. addr_t BuddySpace::AllocNoLock(const uint64_t sz, BSpaceDescriptor *desc) noexcept {
  63. MS_ASSERT(sz <= max_);
  64. uint32_t reqSize = SizeToBlock(sz);
  65. rel_addr_t rel_addr = AllocBuddySeg(reqSize);
  66. if (rel_addr != static_cast<rel_addr_t>(NOSPACE)) {
  67. (void)memset_s(desc, sizeof(BSpaceDescriptor), 0, sizeof(BSpaceDescriptor));
  68. desc->sig = static_cast<int>(0xDEADBEEF);
  69. desc->addr = rel_addr;
  70. desc->req_size = reqSize;
  71. desc->blk_size = NextPowerOf2(reqSize);
  72. return static_cast<addr_t>(rel_addr * min_);
  73. } else {
  74. return NOSPACE;
  75. }
  76. }
  77. void BuddySpace::FreeNoLock(const BSpaceDescriptor *desc) {
  78. MS_ASSERT(desc->sig == 0XDEADBEEF);
  79. rel_addr_t rel_addr = desc->addr;
  80. size_t blk_size = desc->blk_size;
  81. size_t req_size = desc->req_size;
  82. FreeBuddySeg(rel_addr, blk_size, req_size);
  83. }
  84. void BuddySpace::Free(const BSpaceDescriptor *desc) {
  85. std::lock_guard<std::mutex> lock(mutex_);
  86. return FreeNoLock(desc);
  87. }
  88. std::ostream &operator<<(std::ostream &os, const BuddySpace &s) {
  89. os << "1 unit = " << s.GetMinSize() << "\n"
  90. << "Size of buddy space = " << s.GetMaxSize() << "\n"
  91. << "Number of levels = " << s.num_lvl_ << "\n\n"
  92. << "Percent free = " << s.PercentFree() << "\n"
  93. << "Dumping count array : "
  94. << "\n";
  95. for (int i = 0; i < s.num_lvl_; i++) {
  96. os << "[" << i << "] = " << s.count_[i] << " ";
  97. if (((i + 1) % 4) == 0) {
  98. os << "\n";
  99. }
  100. }
  101. os << "\n";
  102. os << "Dumping allocation info:"
  103. << "\n";
  104. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, s.num_lvl_ - 1));
  105. rel_addr_t addr = 0;
  106. while (addr < max_addr) {
  107. size_t sz = 0;
  108. BuddySpace::STATE st;
  109. s.GetBuddySegState(addr, &sz, &st);
  110. os << "Address : " << std::left << std::setw(8) << addr << " Size : " << std::setw(8) << sz << " State : "
  111. << ((st == BuddySpace::STATE::kAlloc) ? "ALLOC" : ((st == BuddySpace::STATE::kFree) ? "FREE" : "Unkonwn"))
  112. << "\n";
  113. addr += sz;
  114. }
  115. return os;
  116. }
  117. void BuddySpace::GetBuddySegState(const rel_addr_t rel_addr, size_t *rel_sz, STATE *st) const {
  118. char byte;
  119. int pos;
  120. int offset;
  121. uint64_t val = 0;
  122. int shift;
  123. pos = BitRightShift(rel_addr, 2);
  124. offset = rel_addr % 4;
  125. shift = offset * 2;
  126. byte = map_[pos];
  127. switch (offset) {
  128. case 0:
  129. val = byte;
  130. break;
  131. case 1:
  132. case 3:
  133. if (offset == 1) {
  134. val = BitLeftShift(BitAnd(byte, 0x30), shift);
  135. } else {
  136. val = BitLeftShift(BitAnd(byte, 0x03), shift);
  137. }
  138. break;
  139. case 2:
  140. val = BitLeftShift(BitAnd(byte, 0x0F), shift);
  141. break;
  142. }
  143. if (BitAnd(val, ONE_BIT)) {
  144. *rel_sz = 1;
  145. } else if (BitAnd(val, TWO_BIT)) {
  146. *rel_sz = 2;
  147. } else if (BitAnd(val, MORE_BIT)) {
  148. log_t lg = BitAnd(val, 0x0F);
  149. *rel_sz = BitLeftShift(1, lg + 2);
  150. } else {
  151. *st = STATE::kEmpty;
  152. return;
  153. }
  154. *st = BitAnd(val, ALLOC_BIT) ? STATE::kAlloc : STATE::kFree;
  155. }
  156. void BuddySpace::SetBuddySegState(rel_addr_t rel_addr, size_t rel_sz, STATE st) {
  157. int clr;
  158. int mask;
  159. int pos;
  160. int offset;
  161. int val = 0;
  162. int shift;
  163. auto log_sz = static_cast<log_t>(Log2(rel_sz));
  164. pos = BitRightShift(rel_addr, 2);
  165. offset = rel_addr % 4;
  166. shift = offset * 2;
  167. if (rel_sz == 1) {
  168. val = ONE_BIT;
  169. mask = 0xC0;
  170. } else if (rel_sz == 2) {
  171. val = TWO_BIT;
  172. mask = 0xF0;
  173. } else {
  174. val = BitOr(log_sz - 2, MORE_BIT);
  175. mask = 0xFF;
  176. }
  177. if (st == STATE::kAlloc) {
  178. val = BitOr(val, ALLOC_BIT);
  179. } else if (st == STATE::kFree) {
  180. val = BitAnd(val, ~(static_cast<uint64_t>(ALLOC_BIT)));
  181. } else if (st == STATE::kEmpty) {
  182. val = 0;
  183. }
  184. clr = static_cast<int>(~(BitRightShift(mask, shift)));
  185. map_[pos] = static_cast<char>(BitAnd(map_[pos], clr));
  186. map_[pos] = static_cast<char>(BitOr(map_[pos], BitRightShift(val, shift)));
  187. if (st == STATE::kAlloc) {
  188. count_[log_sz]--;
  189. } else if (st == STATE::kFree) {
  190. count_[log_sz]++;
  191. if (rel_addr < hint_[log_sz]) {
  192. hint_[log_sz] = rel_addr;
  193. }
  194. }
  195. }
  196. void BuddySpace::JoinBuddySeg(rel_addr_t addr, size_t blk_sz) {
  197. while (blk_sz < BitLeftShift(1, num_lvl_)) {
  198. rel_addr_t buddy = BitEx(addr, blk_sz);
  199. size_t sz = 0;
  200. STATE st;
  201. GetBuddySegState(buddy, &sz, &st);
  202. if (st == STATE::kFree && sz == blk_sz) {
  203. auto log_sz = static_cast<log_t>(Log2(blk_sz));
  204. rel_addr_t left = (buddy < addr) ? buddy : addr;
  205. rel_addr_t right = left + blk_sz;
  206. MS_ASSERT(count_[log_sz] >= 2);
  207. count_[log_sz] -= 2;
  208. SetBuddySegState(right, blk_sz, STATE::kEmpty);
  209. SetBuddySegState(left, BitLeftShift(blk_sz, 1), STATE::kFree);
  210. for (int i = 0; i < log_sz; i++) {
  211. if (hint_[i] == right) {
  212. hint_[i] = left;
  213. }
  214. }
  215. addr = left;
  216. blk_sz <<= 1u;
  217. } else {
  218. break;
  219. }
  220. }
  221. }
  222. void BuddySpace::TrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  223. MS_ASSERT(ask_sz < blk_sz);
  224. uint32_t inx = Log2(blk_sz);
  225. size_t remaining_sz = ask_sz;
  226. for (int i = inx; i > 0; i--) {
  227. size_t b_size = BitLeftShift(1, i);
  228. size_t half_sz = BitRightShift(b_size, 1);
  229. count_[i]--;
  230. SetBuddySegState(addr, half_sz, STATE::kFree);
  231. SetBuddySegState(addr + half_sz, half_sz, STATE::kFree);
  232. if (remaining_sz >= half_sz) {
  233. SetBuddySegState(addr, half_sz, STATE::kAlloc);
  234. remaining_sz -= half_sz;
  235. if (remaining_sz == 0) {
  236. break;
  237. }
  238. addr += half_sz;
  239. }
  240. }
  241. }
  242. void BuddySpace::UnTrimBuddySeg(rel_addr_t addr, size_t blk_sz, size_t ask_sz) {
  243. MS_ASSERT(ask_sz < blk_sz);
  244. uint32_t inx = Log2(blk_sz);
  245. size_t remaining_sz = ask_sz;
  246. for (int i = inx; i > 0; i--) {
  247. size_t b_size = BitLeftShift(1, i);
  248. size_t half_sz = BitRightShift(b_size, 1);
  249. if (remaining_sz >= half_sz) {
  250. #ifdef DEBUG
  251. {
  252. size_t sz = 0;
  253. STATE st;
  254. GetBuddySegState(addr, &sz, &st);
  255. MS_ASSERT(sz == half_sz && st == STATE::kAlloc);
  256. }
  257. #endif
  258. SetBuddySegState(addr, half_sz, STATE::kFree);
  259. remaining_sz -= half_sz;
  260. if (remaining_sz == 0) {
  261. JoinBuddySeg(addr, half_sz);
  262. break;
  263. }
  264. addr += half_sz;
  265. }
  266. }
  267. }
  268. rel_addr_t BuddySpace::AllocBuddySeg(uint32_t req_size) noexcept {
  269. uint32_t blk_size = NextPowerOf2(req_size);
  270. int start_inx = static_cast<int>(Log2(blk_size));
  271. bool found = false;
  272. rel_addr_t ask_addr = 0;
  273. auto max_addr = static_cast<rel_addr_t>(BitLeftShift(1, num_lvl_ - 1));
  274. STATE st;
  275. size_t sz = 0;
  276. for (int i = start_inx; !found && i < num_lvl_; i++) {
  277. MS_ASSERT(count_[i] >= 0);
  278. if (count_[i] == 0) {
  279. continue;
  280. }
  281. auto blk_sz = static_cast<size_t>(BitLeftShift(1, i));
  282. ask_addr = hint_[i];
  283. while (ask_addr < max_addr && !found) {
  284. GetBuddySegState(ask_addr, &sz, &st);
  285. if (st == STATE::kFree && sz == blk_sz) {
  286. found = true;
  287. } else {
  288. MS_ASSERT(st != STATE::kEmpty);
  289. ask_addr += ((sz > blk_sz) ? sz : blk_sz);
  290. }
  291. }
  292. }
  293. if (found) {
  294. if (sz > req_size) {
  295. TrimBuddySeg(ask_addr, sz, req_size);
  296. } else {
  297. SetBuddySegState(ask_addr, sz, STATE::kAlloc);
  298. hint_[start_inx] = ask_addr;
  299. }
  300. return ask_addr;
  301. } else {
  302. return static_cast<rel_addr_t>(NOSPACE);
  303. }
  304. }
  305. void BuddySpace::FreeBuddySeg(rel_addr_t addr, size_t blk_size, size_t req_size) {
  306. if (req_size == blk_size) {
  307. #ifdef DEBUG
  308. {
  309. size_t sz = 0;
  310. STATE st;
  311. GetBuddySegState(addr, &sz, &st);
  312. }
  313. #endif
  314. SetBuddySegState(addr, blk_size, STATE::kFree);
  315. JoinBuddySeg(addr, blk_size);
  316. } else {
  317. UnTrimBuddySeg(addr, blk_size, req_size);
  318. }
  319. }
  320. int BuddySpace::PercentFree() const {
  321. uint64_t total_free_sz = 0;
  322. uint64_t max_sz_in_unit = BitLeftShift(1, num_lvl_ - 1);
  323. // Go through the count array without lock
  324. for (int i = 0; i < num_lvl_; i++) {
  325. int cnt = count_[i];
  326. if (cnt == 0) {
  327. continue;
  328. }
  329. uint64_t blk_sz = BitLeftShift(1, i);
  330. total_free_sz += (blk_sz * cnt);
  331. }
  332. return static_cast<int>(static_cast<float>(total_free_sz) / static_cast<float>(max_sz_in_unit) * 100);
  333. }
  334. BuddySpace::BuddySpace(int log_min, int num_lvl)
  335. : hint_(nullptr),
  336. count_(nullptr),
  337. map_(nullptr),
  338. log_min_(log_min),
  339. num_lvl_(num_lvl),
  340. min_(0),
  341. max_(0),
  342. ptr_(nullptr) {}
  343. BuddySpace::~BuddySpace() {
  344. if (ptr_ != nullptr) {
  345. free(ptr_);
  346. }
  347. hint_ = nullptr;
  348. count_ = nullptr;
  349. map_ = nullptr;
  350. }
  351. Status BuddySpace::CreateBuddySpace(std::unique_ptr<BuddySpace> *out_bs, int log_min, int num_lvl) {
  352. Status rc;
  353. auto bs = new (std::nothrow) BuddySpace(log_min, num_lvl);
  354. if (bs == nullptr) {
  355. return Status(StatusCode::kOutOfMemory);
  356. }
  357. rc = bs->Init();
  358. if (rc.IsOk()) {
  359. (*out_bs).reset(bs);
  360. } else {
  361. delete bs;
  362. }
  363. return rc;
  364. }
  365. } // namespace dataset
  366. } // namespace mindspore