You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ec_object_iterator.go 6.2 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. package iterator
  2. import (
  3. "fmt"
  4. "io"
  5. "math/rand"
  6. "os"
  7. "github.com/samber/lo"
  8. "gitlink.org.cn/cloudream/common/pkgs/logger"
  9. "gitlink.org.cn/cloudream/storage-common/globals"
  10. "gitlink.org.cn/cloudream/storage-common/models"
  11. "gitlink.org.cn/cloudream/storage-common/pkgs/db/model"
  12. "gitlink.org.cn/cloudream/storage-common/pkgs/ec"
  13. coormq "gitlink.org.cn/cloudream/storage-common/pkgs/mq/coordinator"
  14. )
  15. type ECObjectIterator struct {
  16. objects []model.Object
  17. objectECData []models.ObjectECData
  18. currentIndex int
  19. inited bool
  20. ec model.Ec
  21. downloadCtx *ECDownloadContext
  22. cliLocation model.Location
  23. }
  24. type ECDownloadContext struct {
  25. *DownloadContext
  26. ECPacketSize int64
  27. }
  28. func NewECObjectIterator(objects []model.Object, objectECData []models.ObjectECData, ec model.Ec, downloadCtx *ECDownloadContext) *ECObjectIterator {
  29. return &ECObjectIterator{
  30. objects: objects,
  31. objectECData: objectECData,
  32. ec: ec,
  33. downloadCtx: downloadCtx,
  34. }
  35. }
  36. func (i *ECObjectIterator) MoveNext() (*IterDownloadingObject, error) {
  37. coorCli, err := globals.CoordinatorMQPool.Acquire()
  38. if err != nil {
  39. return nil, fmt.Errorf("new coordinator client: %w", err)
  40. }
  41. defer coorCli.Close()
  42. if !i.inited {
  43. i.inited = true
  44. findCliLocResp, err := coorCli.FindClientLocation(coormq.NewFindClientLocation(globals.Local.ExternalIP))
  45. if err != nil {
  46. return nil, fmt.Errorf("finding client location: %w", err)
  47. }
  48. i.cliLocation = findCliLocResp.Location
  49. }
  50. if i.currentIndex >= len(i.objects) {
  51. return nil, ErrNoMoreItem
  52. }
  53. item, err := i.doMove(coorCli)
  54. i.currentIndex++
  55. return item, err
  56. }
  57. func (iter *ECObjectIterator) doMove(coorCli *coormq.PoolClient) (*IterDownloadingObject, error) {
  58. obj := iter.objects[iter.currentIndex]
  59. ecData := iter.objectECData[iter.currentIndex]
  60. blocks := ecData.Blocks
  61. ec := iter.ec
  62. ecK := ec.EcK
  63. ecN := ec.EcN
  64. //采取直接读,优先选内网节点
  65. hashs := make([]string, ecK)
  66. nds := make([]DownloadNodeInfo, ecK)
  67. for i := 0; i < ecK; i++ {
  68. hashs[i] = blocks[i].FileHash
  69. getNodesResp, err := coorCli.GetNodes(coormq.NewGetNodes(blocks[i].NodeIDs))
  70. if err != nil {
  71. return nil, fmt.Errorf("getting nodes: %w", err)
  72. }
  73. downloadNodes := lo.Map(getNodesResp.Nodes, func(node model.Node, index int) DownloadNodeInfo {
  74. return DownloadNodeInfo{
  75. Node: node,
  76. IsSameLocation: node.LocationID == iter.cliLocation.LocationID,
  77. }
  78. })
  79. nds[i] = iter.chooseDownloadNode(downloadNodes)
  80. }
  81. //nodeIDs, nodeIPs直接按照第1~ecK个排列
  82. nodeIDs := make([]int64, ecK)
  83. nodeIPs := make([]string, ecK)
  84. for i := 0; i < ecK; i++ {
  85. nodeIDs[i] = nds[i].Node.NodeID
  86. nodeIPs[i] = nds[i].Node.ExternalIP
  87. if nds[i].IsSameLocation {
  88. nodeIPs[i] = nds[i].Node.LocalIP
  89. logger.Infof("client and node %d are at the same location, use local ip\n", nds[i].Node.NodeID)
  90. }
  91. }
  92. fileSize := obj.Size
  93. blockIDs := make([]int, ecK)
  94. for i := 0; i < ecK; i++ {
  95. blockIDs[i] = i
  96. }
  97. reader, err := iter.downloadEcObject(fileSize, ecK, ecN, blockIDs, nodeIDs, nodeIPs, hashs)
  98. if err != nil {
  99. return nil, fmt.Errorf("ec read failed, err: %w", err)
  100. }
  101. return &IterDownloadingObject{
  102. File: reader,
  103. }, nil
  104. }
  105. func (i *ECObjectIterator) Close() {
  106. }
  107. // chooseDownloadNode 选择一个下载节点
  108. // 1. 从与当前客户端相同地域的节点中随机选一个
  109. // 2. 没有用的话从所有节点中随机选一个
  110. func (i *ECObjectIterator) chooseDownloadNode(entries []DownloadNodeInfo) DownloadNodeInfo {
  111. sameLocationEntries := lo.Filter(entries, func(e DownloadNodeInfo, i int) bool { return e.IsSameLocation })
  112. if len(sameLocationEntries) > 0 {
  113. return sameLocationEntries[rand.Intn(len(sameLocationEntries))]
  114. }
  115. return entries[rand.Intn(len(entries))]
  116. }
  117. func (iter *ECObjectIterator) downloadEcObject(fileSize int64, ecK int, ecN int, blockIDs []int, nodeIDs []int64, nodeIPs []string, hashs []string) (io.ReadCloser, error) {
  118. // TODO zkx 先试用同步方式实现逻辑,做好错误处理。同时也方便下面直接使用uploadToNode和uploadToLocalIPFS来优化代码结构
  119. //wg := sync.WaitGroup{}
  120. numPacket := (fileSize + int64(ecK)*iter.downloadCtx.ECPacketSize - 1) / (int64(ecK) * iter.downloadCtx.ECPacketSize)
  121. getBufs := make([]chan []byte, ecN)
  122. decodeBufs := make([]chan []byte, ecK)
  123. for i := 0; i < ecN; i++ {
  124. getBufs[i] = make(chan []byte)
  125. }
  126. for i := 0; i < ecK; i++ {
  127. decodeBufs[i] = make(chan []byte)
  128. }
  129. for idx := 0; idx < len(blockIDs); idx++ {
  130. i := idx
  131. go func() {
  132. // TODO 处理错误
  133. file, _ := downloadFile(iter.downloadCtx.DownloadContext, nodeIDs[i], nodeIPs[i], hashs[i])
  134. for p := int64(0); p < numPacket; p++ {
  135. buf := make([]byte, iter.downloadCtx.ECPacketSize)
  136. // TODO 处理错误
  137. io.ReadFull(file, buf)
  138. getBufs[blockIDs[i]] <- buf
  139. }
  140. }()
  141. }
  142. print(numPacket)
  143. go decode(getBufs[:], decodeBufs[:], blockIDs, ecK, numPacket)
  144. r, w := io.Pipe()
  145. //persist函数,将解码得到的文件写入pipe
  146. go func() {
  147. for i := 0; int64(i) < numPacket; i++ {
  148. for j := 0; j < len(decodeBufs); j++ {
  149. tmp := <-decodeBufs[j]
  150. _, err := w.Write(tmp)
  151. if err != nil {
  152. fmt.Errorf("persist file falied, err:%w", err)
  153. }
  154. }
  155. }
  156. w.Close()
  157. }()
  158. return r, nil
  159. }
  160. func decode(inBufs []chan []byte, outBufs []chan []byte, blockSeq []int, ecK int, numPacket int64) {
  161. fmt.Println("decode ")
  162. var tmpIn [][]byte
  163. var zeroPkt []byte
  164. tmpIn = make([][]byte, len(inBufs))
  165. hasBlock := map[int]bool{}
  166. for j := 0; j < len(blockSeq); j++ {
  167. hasBlock[blockSeq[j]] = true
  168. }
  169. needRepair := false //检测是否传入了所有数据块
  170. for j := 0; j < len(outBufs); j++ {
  171. if blockSeq[j] != j {
  172. needRepair = true
  173. }
  174. }
  175. enc := ec.NewRsEnc(ecK, len(inBufs))
  176. for i := 0; int64(i) < numPacket; i++ {
  177. print("!!!!!")
  178. for j := 0; j < len(inBufs); j++ {
  179. if hasBlock[j] {
  180. tmpIn[j] = <-inBufs[j]
  181. } else {
  182. tmpIn[j] = zeroPkt
  183. }
  184. }
  185. if needRepair {
  186. err := enc.Repair(tmpIn)
  187. if err != nil {
  188. fmt.Fprintf(os.Stderr, "Decode Repair Error: %s", err.Error())
  189. }
  190. }
  191. for j := 0; j < len(outBufs); j++ {
  192. outBufs[j] <- tmpIn[j]
  193. }
  194. }
  195. for i := 0; i < len(outBufs); i++ {
  196. close(outBufs[i])
  197. }
  198. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。