You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

storage_load_package.go 10 kB

2 years ago
2 years ago
2 years ago
2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356
  1. package task
  2. import (
  3. "fmt"
  4. "io"
  5. "math"
  6. "os"
  7. "path/filepath"
  8. "time"
  9. "github.com/samber/lo"
  10. "gitlink.org.cn/cloudream/common/pkgs/bitmap"
  11. "gitlink.org.cn/cloudream/common/pkgs/ipfs"
  12. "gitlink.org.cn/cloudream/common/pkgs/task"
  13. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  14. "gitlink.org.cn/cloudream/common/utils/io2"
  15. "gitlink.org.cn/cloudream/common/utils/reflect2"
  16. "gitlink.org.cn/cloudream/common/utils/sort2"
  17. "gitlink.org.cn/cloudream/storage/common/consts"
  18. stgglb "gitlink.org.cn/cloudream/storage/common/globals"
  19. stgmod "gitlink.org.cn/cloudream/storage/common/models"
  20. "gitlink.org.cn/cloudream/storage/common/pkgs/distlock/reqbuilder"
  21. "gitlink.org.cn/cloudream/storage/common/pkgs/ec"
  22. coormq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/coordinator"
  23. "gitlink.org.cn/cloudream/storage/common/utils"
  24. )
  25. type StorageLoadPackage struct {
  26. PackagePath string
  27. LocalBase string
  28. RemoteBase string
  29. userID cdssdk.UserID
  30. packageID cdssdk.PackageID
  31. storageID cdssdk.StorageID
  32. pinnedBlocks []stgmod.ObjectBlock
  33. }
  34. func NewStorageLoadPackage(userID cdssdk.UserID, packageID cdssdk.PackageID, storageID cdssdk.StorageID) *StorageLoadPackage {
  35. return &StorageLoadPackage{
  36. userID: userID,
  37. packageID: packageID,
  38. storageID: storageID,
  39. }
  40. }
  41. func (t *StorageLoadPackage) Execute(task *task.Task[TaskContext], ctx TaskContext, complete CompleteFn) {
  42. err := t.do(task, ctx)
  43. complete(err, CompleteOption{
  44. RemovingDelay: time.Minute,
  45. })
  46. }
  47. func (t *StorageLoadPackage) do(task *task.Task[TaskContext], ctx TaskContext) error {
  48. coorCli, err := stgglb.CoordinatorMQPool.Acquire()
  49. if err != nil {
  50. return fmt.Errorf("new coordinator client: %w", err)
  51. }
  52. defer stgglb.CoordinatorMQPool.Release(coorCli)
  53. ipfsCli, err := stgglb.IPFSPool.Acquire()
  54. if err != nil {
  55. return fmt.Errorf("new IPFS client: %w", err)
  56. }
  57. defer stgglb.IPFSPool.Release(ipfsCli)
  58. getStgResp, err := coorCli.GetStorage(coormq.ReqGetStorage(t.userID, t.storageID))
  59. if err != nil {
  60. return fmt.Errorf("request to coordinator: %w", err)
  61. }
  62. t.PackagePath = utils.MakeLoadedPackagePath(t.userID, t.packageID)
  63. fullLocalPath := filepath.Join(getStgResp.Storage.LocalBase, t.PackagePath)
  64. if err = os.MkdirAll(fullLocalPath, 0755); err != nil {
  65. return fmt.Errorf("creating output directory: %w", err)
  66. }
  67. getObjectDetails, err := coorCli.GetPackageObjectDetails(coormq.ReqGetPackageObjectDetails(t.packageID))
  68. if err != nil {
  69. return fmt.Errorf("getting package object details: %w", err)
  70. }
  71. mutex, err := reqbuilder.NewBuilder().
  72. // 提前占位
  73. Metadata().StoragePackage().CreateOne(t.userID, t.storageID, t.packageID).
  74. // 保护在storage目录中下载的文件
  75. Storage().Buzy(t.storageID).
  76. // 保护下载文件时同时保存到IPFS的文件
  77. IPFS().Buzy(getStgResp.Storage.NodeID).
  78. MutexLock(ctx.distlock)
  79. if err != nil {
  80. return fmt.Errorf("acquire locks failed, err: %w", err)
  81. }
  82. defer mutex.Unlock()
  83. for _, obj := range getObjectDetails.Objects {
  84. err := t.downloadOne(coorCli, ipfsCli, fullLocalPath, obj)
  85. if err != nil {
  86. return err
  87. }
  88. ctx.accessStat.AddAccessCounter(obj.Object.ObjectID, t.packageID, *stgglb.Local.NodeID, 1)
  89. }
  90. _, err = coorCli.StoragePackageLoaded(coormq.NewStoragePackageLoaded(t.userID, t.storageID, t.packageID, t.pinnedBlocks))
  91. if err != nil {
  92. return fmt.Errorf("loading package to storage: %w", err)
  93. }
  94. // TODO 要防止下载的临时文件被删除
  95. return err
  96. }
  97. func (t *StorageLoadPackage) downloadOne(coorCli *coormq.Client, ipfsCli *ipfs.PoolClient, dir string, obj stgmod.ObjectDetail) error {
  98. var file io.ReadCloser
  99. switch red := obj.Object.Redundancy.(type) {
  100. case *cdssdk.NoneRedundancy:
  101. reader, err := t.downloadNoneOrRepObject(ipfsCli, obj)
  102. if err != nil {
  103. return fmt.Errorf("downloading object: %w", err)
  104. }
  105. file = reader
  106. case *cdssdk.RepRedundancy:
  107. reader, err := t.downloadNoneOrRepObject(ipfsCli, obj)
  108. if err != nil {
  109. return fmt.Errorf("downloading rep object: %w", err)
  110. }
  111. file = reader
  112. case *cdssdk.ECRedundancy:
  113. reader, pinnedBlocks, err := t.downloadECObject(coorCli, ipfsCli, obj, red)
  114. if err != nil {
  115. return fmt.Errorf("downloading ec object: %w", err)
  116. }
  117. file = reader
  118. t.pinnedBlocks = append(t.pinnedBlocks, pinnedBlocks...)
  119. default:
  120. return fmt.Errorf("unknow redundancy type: %v", reflect2.TypeOfValue(obj.Object.Redundancy))
  121. }
  122. defer file.Close()
  123. fullPath := filepath.Join(dir, obj.Object.Path)
  124. lastDirPath := filepath.Dir(fullPath)
  125. if err := os.MkdirAll(lastDirPath, 0755); err != nil {
  126. return fmt.Errorf("creating object last dir: %w", err)
  127. }
  128. outputFile, err := os.Create(fullPath)
  129. if err != nil {
  130. return fmt.Errorf("creating object file: %w", err)
  131. }
  132. defer outputFile.Close()
  133. if _, err := io.Copy(outputFile, file); err != nil {
  134. return fmt.Errorf("writting object to file: %w", err)
  135. }
  136. return nil
  137. }
  138. func (t *StorageLoadPackage) downloadNoneOrRepObject(ipfsCli *ipfs.PoolClient, obj stgmod.ObjectDetail) (io.ReadCloser, error) {
  139. if len(obj.Blocks) == 0 && len(obj.PinnedAt) == 0 {
  140. return nil, fmt.Errorf("no node has this object")
  141. }
  142. // 不管实际有没有成功
  143. ipfsCli.Pin(obj.Object.FileHash)
  144. file, err := ipfsCli.OpenRead(obj.Object.FileHash)
  145. if err != nil {
  146. return nil, err
  147. }
  148. return file, nil
  149. }
  150. func (t *StorageLoadPackage) downloadECObject(coorCli *coormq.Client, ipfsCli *ipfs.PoolClient, obj stgmod.ObjectDetail, ecRed *cdssdk.ECRedundancy) (io.ReadCloser, []stgmod.ObjectBlock, error) {
  151. allNodes, err := t.sortDownloadNodes(coorCli, obj)
  152. if err != nil {
  153. return nil, nil, err
  154. }
  155. bsc, blocks := t.getMinReadingBlockSolution(allNodes, ecRed.K)
  156. osc, _ := t.getMinReadingObjectSolution(allNodes, ecRed.K)
  157. if bsc < osc {
  158. var fileStrs []io.ReadCloser
  159. rs, err := ec.NewStreamRs(ecRed.K, ecRed.N, ecRed.ChunkSize)
  160. if err != nil {
  161. return nil, nil, fmt.Errorf("new rs: %w", err)
  162. }
  163. for i := range blocks {
  164. // 不管实际有没有成功
  165. ipfsCli.Pin(blocks[i].Block.FileHash)
  166. str, err := ipfsCli.OpenRead(blocks[i].Block.FileHash)
  167. if err != nil {
  168. for i -= 1; i >= 0; i-- {
  169. fileStrs[i].Close()
  170. }
  171. return nil, nil, fmt.Errorf("donwloading file: %w", err)
  172. }
  173. fileStrs = append(fileStrs, str)
  174. }
  175. fileReaders, filesCloser := io2.ToReaders(fileStrs)
  176. var indexes []int
  177. var pinnedBlocks []stgmod.ObjectBlock
  178. for _, b := range blocks {
  179. indexes = append(indexes, b.Block.Index)
  180. pinnedBlocks = append(pinnedBlocks, stgmod.ObjectBlock{
  181. ObjectID: b.Block.ObjectID,
  182. Index: b.Block.Index,
  183. NodeID: *stgglb.Local.NodeID,
  184. FileHash: b.Block.FileHash,
  185. })
  186. }
  187. outputs, outputsCloser := io2.ToReaders(rs.ReconstructData(fileReaders, indexes))
  188. return io2.AfterReadClosed(io2.Length(io2.ChunkedJoin(outputs, int(ecRed.ChunkSize)), obj.Object.Size), func(c io.ReadCloser) {
  189. filesCloser()
  190. outputsCloser()
  191. }), pinnedBlocks, nil
  192. }
  193. // bsc >= osc,如果osc是MaxFloat64,那么bsc也一定是,也就意味着没有足够块来恢复文件
  194. if osc == math.MaxFloat64 {
  195. return nil, nil, fmt.Errorf("no enough blocks to reconstruct the file, want %d, get only %d", ecRed.K, len(blocks))
  196. }
  197. // 如果是直接读取的文件,那么就不需要Pin文件块
  198. str, err := ipfsCli.OpenRead(obj.Object.FileHash)
  199. return str, nil, err
  200. }
  201. type downloadNodeInfo struct {
  202. Node cdssdk.Node
  203. ObjectPinned bool
  204. Blocks []stgmod.ObjectBlock
  205. Distance float64
  206. }
  207. func (t *StorageLoadPackage) sortDownloadNodes(coorCli *coormq.Client, obj stgmod.ObjectDetail) ([]*downloadNodeInfo, error) {
  208. var nodeIDs []cdssdk.NodeID
  209. for _, id := range obj.PinnedAt {
  210. if !lo.Contains(nodeIDs, id) {
  211. nodeIDs = append(nodeIDs, id)
  212. }
  213. }
  214. for _, b := range obj.Blocks {
  215. if !lo.Contains(nodeIDs, b.NodeID) {
  216. nodeIDs = append(nodeIDs, b.NodeID)
  217. }
  218. }
  219. getNodes, err := coorCli.GetNodes(coormq.NewGetNodes(nodeIDs))
  220. if err != nil {
  221. return nil, fmt.Errorf("getting nodes: %w", err)
  222. }
  223. downloadNodeMap := make(map[cdssdk.NodeID]*downloadNodeInfo)
  224. for _, id := range obj.PinnedAt {
  225. node, ok := downloadNodeMap[id]
  226. if !ok {
  227. mod := *getNodes.GetNode(id)
  228. node = &downloadNodeInfo{
  229. Node: mod,
  230. ObjectPinned: true,
  231. Distance: t.getNodeDistance(mod),
  232. }
  233. downloadNodeMap[id] = node
  234. }
  235. node.ObjectPinned = true
  236. }
  237. for _, b := range obj.Blocks {
  238. node, ok := downloadNodeMap[b.NodeID]
  239. if !ok {
  240. mod := *getNodes.GetNode(b.NodeID)
  241. node = &downloadNodeInfo{
  242. Node: mod,
  243. Distance: t.getNodeDistance(mod),
  244. }
  245. downloadNodeMap[b.NodeID] = node
  246. }
  247. node.Blocks = append(node.Blocks, b)
  248. }
  249. return sort2.Sort(lo.Values(downloadNodeMap), func(left, right *downloadNodeInfo) int {
  250. return sort2.Cmp(left.Distance, right.Distance)
  251. }), nil
  252. }
  253. type downloadBlock struct {
  254. Node cdssdk.Node
  255. Block stgmod.ObjectBlock
  256. }
  257. func (t *StorageLoadPackage) getMinReadingBlockSolution(sortedNodes []*downloadNodeInfo, k int) (float64, []downloadBlock) {
  258. gotBlocksMap := bitmap.Bitmap64(0)
  259. var gotBlocks []downloadBlock
  260. dist := float64(0.0)
  261. for _, n := range sortedNodes {
  262. for _, b := range n.Blocks {
  263. if !gotBlocksMap.Get(b.Index) {
  264. gotBlocks = append(gotBlocks, downloadBlock{
  265. Node: n.Node,
  266. Block: b,
  267. })
  268. gotBlocksMap.Set(b.Index, true)
  269. dist += n.Distance
  270. }
  271. if len(gotBlocks) >= k {
  272. return dist, gotBlocks
  273. }
  274. }
  275. }
  276. return math.MaxFloat64, gotBlocks
  277. }
  278. func (t *StorageLoadPackage) getMinReadingObjectSolution(sortedNodes []*downloadNodeInfo, k int) (float64, *cdssdk.Node) {
  279. dist := math.MaxFloat64
  280. var downloadNode *cdssdk.Node
  281. for _, n := range sortedNodes {
  282. if n.ObjectPinned && float64(k)*n.Distance < dist {
  283. dist = float64(k) * n.Distance
  284. downloadNode = &n.Node
  285. }
  286. }
  287. return dist, downloadNode
  288. }
  289. func (t *StorageLoadPackage) getNodeDistance(node cdssdk.Node) float64 {
  290. if stgglb.Local.NodeID != nil {
  291. if node.NodeID == *stgglb.Local.NodeID {
  292. return consts.NodeDistanceSameNode
  293. }
  294. }
  295. if node.LocationID == stgglb.Local.LocationID {
  296. return consts.NodeDistanceSameLocation
  297. }
  298. return consts.NodeDistanceOther
  299. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。