You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

object.go 12 kB

2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380
  1. package db
  2. import (
  3. "fmt"
  4. "strings"
  5. "time"
  6. "github.com/jmoiron/sqlx"
  7. "github.com/samber/lo"
  8. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  9. "gitlink.org.cn/cloudream/common/utils/sort2"
  10. stgmod "gitlink.org.cn/cloudream/storage/common/models"
  11. "gitlink.org.cn/cloudream/storage/common/pkgs/db/model"
  12. coormq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/coordinator"
  13. )
  14. type ObjectDB struct {
  15. *DB
  16. }
  17. func (db *DB) Object() *ObjectDB {
  18. return &ObjectDB{DB: db}
  19. }
  20. func (db *ObjectDB) GetByID(ctx SQLContext, objectID cdssdk.ObjectID) (model.Object, error) {
  21. var ret model.TempObject
  22. err := sqlx.Get(ctx, &ret, "select * from Object where ObjectID = ?", objectID)
  23. return ret.ToObject(), err
  24. }
  25. func (db *ObjectDB) BatchTestObjectID(ctx SQLContext, objectIDs []cdssdk.ObjectID) (map[cdssdk.ObjectID]bool, error) {
  26. if len(objectIDs) == 0 {
  27. return make(map[cdssdk.ObjectID]bool), nil
  28. }
  29. stmt, args, err := sqlx.In("select ObjectID from Object where ObjectID in (?)", lo.Uniq(objectIDs))
  30. if err != nil {
  31. return nil, err
  32. }
  33. var avaiIDs []cdssdk.ObjectID
  34. err = sqlx.Select(ctx, &avaiIDs, stmt, args...)
  35. if err != nil {
  36. return nil, err
  37. }
  38. avaiIDMap := make(map[cdssdk.ObjectID]bool)
  39. for _, pkgID := range avaiIDs {
  40. avaiIDMap[pkgID] = true
  41. }
  42. return avaiIDMap, nil
  43. }
  44. func (db *ObjectDB) BatchGet(ctx SQLContext, objectIDs []cdssdk.ObjectID) ([]model.Object, error) {
  45. if len(objectIDs) == 0 {
  46. return nil, nil
  47. }
  48. // TODO In语句
  49. stmt, args, err := sqlx.In("select * from Object where ObjectID in (?) order by ObjectID asc", objectIDs)
  50. if err != nil {
  51. return nil, err
  52. }
  53. stmt = ctx.Rebind(stmt)
  54. objs := make([]model.TempObject, 0, len(objectIDs))
  55. err = sqlx.Select(ctx, &objs, stmt, args...)
  56. if err != nil {
  57. return nil, err
  58. }
  59. return lo.Map(objs, func(o model.TempObject, idx int) cdssdk.Object { return o.ToObject() }), nil
  60. }
  61. func (db *ObjectDB) BatchGetByPackagePath(ctx SQLContext, pkgID cdssdk.PackageID, pathes []string) ([]cdssdk.Object, error) {
  62. if len(pathes) == 0 {
  63. return nil, nil
  64. }
  65. // TODO In语句
  66. stmt, args, err := sqlx.In("select * from Object force index(PackagePath) where PackageID=? and Path in (?)", pkgID, pathes)
  67. if err != nil {
  68. return nil, err
  69. }
  70. stmt = ctx.Rebind(stmt)
  71. objs := make([]model.TempObject, 0, len(pathes))
  72. err = sqlx.Select(ctx, &objs, stmt, args...)
  73. if err != nil {
  74. return nil, err
  75. }
  76. return lo.Map(objs, func(o model.TempObject, idx int) cdssdk.Object { return o.ToObject() }), nil
  77. }
  78. func (db *ObjectDB) Create(ctx SQLContext, obj cdssdk.Object) (cdssdk.ObjectID, error) {
  79. sql := "insert into Object(PackageID, Path, Size, FileHash, Redundancy, CreateTime, UpdateTime) values(?,?,?,?,?,?,?)"
  80. ret, err := ctx.Exec(sql, obj.PackageID, obj.Path, obj.Size, obj.FileHash, obj.Redundancy, obj.UpdateTime, obj.UpdateTime)
  81. if err != nil {
  82. return 0, fmt.Errorf("insert object failed, err: %w", err)
  83. }
  84. objectID, err := ret.LastInsertId()
  85. if err != nil {
  86. return 0, fmt.Errorf("get id of inserted object failed, err: %w", err)
  87. }
  88. return cdssdk.ObjectID(objectID), nil
  89. }
  90. // 可以用于批量创建或者更新记录。
  91. // 用于创建时,需要额外检查PackageID+Path的唯一性。
  92. // 用于更新时,需要额外检查现存的PackageID+Path对应的ObjectID是否与待更新的ObjectID相同。不会更新CreateTime。
  93. func (db *ObjectDB) BatchUpsertByPackagePath(ctx SQLContext, objs []cdssdk.Object) error {
  94. if len(objs) == 0 {
  95. return nil
  96. }
  97. sql := "insert into Object(PackageID, Path, Size, FileHash, Redundancy, CreateTime ,UpdateTime)" +
  98. " values(:PackageID,:Path,:Size,:FileHash,:Redundancy, :CreateTime, :UpdateTime) as new" +
  99. " on duplicate key update Size = new.Size, FileHash = new.FileHash, Redundancy = new.Redundancy, UpdateTime = new.UpdateTime"
  100. return BatchNamedExec(ctx, sql, 7, objs, nil)
  101. }
  102. func (db *ObjectDB) BatchUpert(ctx SQLContext, objs []cdssdk.Object) error {
  103. if len(objs) == 0 {
  104. return nil
  105. }
  106. sql := "insert into Object(ObjectID, PackageID, Path, Size, FileHash, Redundancy, CreateTime ,UpdateTime)" +
  107. " values(:ObjectID, :PackageID,:Path,:Size,:FileHash,:Redundancy, :CreateTime, :UpdateTime) as new" +
  108. " on duplicate key update PackageID = new.PackageID, Path = new.Path, Size = new.Size, FileHash = new.FileHash, Redundancy = new.Redundancy, UpdateTime = new.UpdateTime"
  109. return BatchNamedExec(ctx, sql, 8, objs, nil)
  110. }
  111. func (*ObjectDB) GetPackageObjects(ctx SQLContext, packageID cdssdk.PackageID) ([]model.Object, error) {
  112. var ret []model.TempObject
  113. err := sqlx.Select(ctx, &ret, "select * from Object where PackageID = ? order by ObjectID asc", packageID)
  114. return lo.Map(ret, func(o model.TempObject, idx int) model.Object { return o.ToObject() }), err
  115. }
  116. func (db *ObjectDB) GetPackageObjectDetails(ctx SQLContext, packageID cdssdk.PackageID) ([]stgmod.ObjectDetail, error) {
  117. var objs []model.TempObject
  118. err := sqlx.Select(ctx, &objs, "select * from Object where PackageID = ? order by ObjectID asc", packageID)
  119. if err != nil {
  120. return nil, fmt.Errorf("getting objects: %w", err)
  121. }
  122. rets := make([]stgmod.ObjectDetail, 0, len(objs))
  123. var allBlocks []stgmod.ObjectBlock
  124. err = sqlx.Select(ctx, &allBlocks, "select ObjectBlock.* from ObjectBlock, Object where PackageID = ? and ObjectBlock.ObjectID = Object.ObjectID order by ObjectBlock.ObjectID, `Index` asc", packageID)
  125. if err != nil {
  126. return nil, fmt.Errorf("getting all object blocks: %w", err)
  127. }
  128. var allPinnedObjs []cdssdk.PinnedObject
  129. err = sqlx.Select(ctx, &allPinnedObjs, "select PinnedObject.* from PinnedObject, Object where PackageID = ? and PinnedObject.ObjectID = Object.ObjectID order by PinnedObject.ObjectID", packageID)
  130. if err != nil {
  131. return nil, fmt.Errorf("getting all pinned objects: %w", err)
  132. }
  133. blksCur := 0
  134. pinnedsCur := 0
  135. for _, temp := range objs {
  136. detail := stgmod.ObjectDetail{
  137. Object: temp.ToObject(),
  138. }
  139. // 1. 查询Object和ObjectBlock时均按照ObjectID升序排序
  140. // 2. ObjectBlock结果集中的不同ObjectID数只会比Object结果集的少
  141. // 因此在两个结果集上同时从头开始遍历时,如果两边的ObjectID字段不同,那么一定是ObjectBlock这边的ObjectID > Object的ObjectID,
  142. // 此时让Object的遍历游标前进,直到两边的ObjectID再次相等
  143. for ; blksCur < len(allBlocks); blksCur++ {
  144. if allBlocks[blksCur].ObjectID != temp.ObjectID {
  145. break
  146. }
  147. detail.Blocks = append(detail.Blocks, allBlocks[blksCur])
  148. }
  149. for ; pinnedsCur < len(allPinnedObjs); pinnedsCur++ {
  150. if allPinnedObjs[pinnedsCur].ObjectID != temp.ObjectID {
  151. break
  152. }
  153. detail.PinnedAt = append(detail.PinnedAt, allPinnedObjs[pinnedsCur].NodeID)
  154. }
  155. rets = append(rets, detail)
  156. }
  157. return rets, nil
  158. }
  159. func (db *ObjectDB) BatchAdd(ctx SQLContext, packageID cdssdk.PackageID, adds []coormq.AddObjectEntry) ([]cdssdk.Object, error) {
  160. if len(adds) == 0 {
  161. return nil, nil
  162. }
  163. objs := make([]cdssdk.Object, 0, len(adds))
  164. for _, add := range adds {
  165. objs = append(objs, cdssdk.Object{
  166. PackageID: packageID,
  167. Path: add.Path,
  168. Size: add.Size,
  169. FileHash: add.FileHash,
  170. Redundancy: cdssdk.NewNoneRedundancy(), // 首次上传默认使用不分块的none模式
  171. CreateTime: add.UploadTime,
  172. UpdateTime: add.UploadTime,
  173. })
  174. }
  175. err := db.BatchUpsertByPackagePath(ctx, objs)
  176. if err != nil {
  177. return nil, fmt.Errorf("batch create or update objects: %w", err)
  178. }
  179. pathes := make([]string, 0, len(adds))
  180. for _, add := range adds {
  181. pathes = append(pathes, add.Path)
  182. }
  183. // 这里可以不用检查查询结果是否与pathes的数量相同
  184. addedObjs, err := db.BatchGetByPackagePath(ctx, packageID, pathes)
  185. if err != nil {
  186. return nil, fmt.Errorf("batch get object ids: %w", err)
  187. }
  188. // 所有需要按索引来一一对应的数据都需要进行排序
  189. adds = sort2.Sort(adds, func(l, r coormq.AddObjectEntry) int { return strings.Compare(l.Path, r.Path) })
  190. addedObjs = sort2.Sort(addedObjs, func(l, r cdssdk.Object) int { return strings.Compare(l.Path, r.Path) })
  191. addedObjIDs := make([]cdssdk.ObjectID, len(addedObjs))
  192. for i := range addedObjs {
  193. addedObjIDs[i] = addedObjs[i].ObjectID
  194. }
  195. err = db.ObjectBlock().BatchDeleteByObjectID(ctx, addedObjIDs)
  196. if err != nil {
  197. return nil, fmt.Errorf("batch delete object blocks: %w", err)
  198. }
  199. err = db.PinnedObject().BatchDeleteByObjectID(ctx, addedObjIDs)
  200. if err != nil {
  201. return nil, fmt.Errorf("batch delete pinned objects: %w", err)
  202. }
  203. objBlocks := make([]stgmod.ObjectBlock, 0, len(adds))
  204. for i, add := range adds {
  205. objBlocks = append(objBlocks, stgmod.ObjectBlock{
  206. ObjectID: addedObjIDs[i],
  207. Index: 0,
  208. NodeID: add.NodeID,
  209. FileHash: add.FileHash,
  210. })
  211. }
  212. err = db.ObjectBlock().BatchCreate(ctx, objBlocks)
  213. if err != nil {
  214. return nil, fmt.Errorf("batch create object blocks: %w", err)
  215. }
  216. caches := make([]model.Cache, 0, len(adds))
  217. for _, add := range adds {
  218. caches = append(caches, model.Cache{
  219. FileHash: add.FileHash,
  220. NodeID: add.NodeID,
  221. CreateTime: time.Now(),
  222. Priority: 0,
  223. })
  224. }
  225. err = db.Cache().BatchCreate(ctx, caches)
  226. if err != nil {
  227. return nil, fmt.Errorf("batch create caches: %w", err)
  228. }
  229. return addedObjs, nil
  230. }
  231. func (db *ObjectDB) BatchUpdateRedundancy(ctx SQLContext, objs []coormq.UpdatingObjectRedundancy) error {
  232. if len(objs) == 0 {
  233. return nil
  234. }
  235. nowTime := time.Now()
  236. objIDs := make([]cdssdk.ObjectID, 0, len(objs))
  237. dummyObjs := make([]cdssdk.Object, 0, len(objs))
  238. for _, obj := range objs {
  239. objIDs = append(objIDs, obj.ObjectID)
  240. dummyObjs = append(dummyObjs, cdssdk.Object{
  241. ObjectID: obj.ObjectID,
  242. Redundancy: obj.Redundancy,
  243. CreateTime: nowTime,
  244. UpdateTime: nowTime,
  245. })
  246. }
  247. // 目前只能使用这种方式来同时更新大量数据
  248. err := BatchNamedExec(ctx,
  249. "insert into Object(ObjectID, PackageID, Path, Size, FileHash, Redundancy, CreateTime, UpdateTime)"+
  250. " values(:ObjectID, :PackageID, :Path, :Size, :FileHash, :Redundancy, :CreateTime, :UpdateTime) as new"+
  251. " on duplicate key update Redundancy=new.Redundancy", 8, dummyObjs, nil)
  252. if err != nil {
  253. return fmt.Errorf("batch update object redundancy: %w", err)
  254. }
  255. // 删除原本所有的编码块记录,重新添加
  256. err = db.ObjectBlock().BatchDeleteByObjectID(ctx, objIDs)
  257. if err != nil {
  258. return fmt.Errorf("batch delete object blocks: %w", err)
  259. }
  260. // 删除原本Pin住的Object。暂不考虑FileHash没有变化的情况
  261. err = db.PinnedObject().BatchDeleteByObjectID(ctx, objIDs)
  262. if err != nil {
  263. return fmt.Errorf("batch delete pinned object: %w", err)
  264. }
  265. blocks := make([]stgmod.ObjectBlock, 0, len(objs))
  266. for _, obj := range objs {
  267. blocks = append(blocks, obj.Blocks...)
  268. }
  269. err = db.ObjectBlock().BatchCreate(ctx, blocks)
  270. if err != nil {
  271. return fmt.Errorf("batch create object blocks: %w", err)
  272. }
  273. caches := make([]model.Cache, 0, len(objs))
  274. for _, obj := range objs {
  275. for _, blk := range obj.Blocks {
  276. caches = append(caches, model.Cache{
  277. FileHash: blk.FileHash,
  278. NodeID: blk.NodeID,
  279. CreateTime: time.Now(),
  280. Priority: 0,
  281. })
  282. }
  283. }
  284. err = db.Cache().BatchCreate(ctx, caches)
  285. if err != nil {
  286. return fmt.Errorf("batch create object caches: %w", err)
  287. }
  288. pinneds := make([]cdssdk.PinnedObject, 0, len(objs))
  289. for _, obj := range objs {
  290. for _, p := range obj.PinnedAt {
  291. pinneds = append(pinneds, cdssdk.PinnedObject{
  292. ObjectID: obj.ObjectID,
  293. NodeID: p,
  294. CreateTime: time.Now(),
  295. })
  296. }
  297. }
  298. err = db.PinnedObject().BatchTryCreate(ctx, pinneds)
  299. if err != nil {
  300. return fmt.Errorf("batch create pinned objects: %w", err)
  301. }
  302. return nil
  303. }
  304. func (*ObjectDB) BatchDelete(ctx SQLContext, ids []cdssdk.ObjectID) error {
  305. if len(ids) == 0 {
  306. return nil
  307. }
  308. query, args, err := sqlx.In("delete from Object where ObjectID in (?)", ids)
  309. if err != nil {
  310. return err
  311. }
  312. _, err = ctx.Exec(query, args...)
  313. return err
  314. }
  315. func (*ObjectDB) DeleteInPackage(ctx SQLContext, packageID cdssdk.PackageID) error {
  316. _, err := ctx.Exec("delete from Object where PackageID = ?", packageID)
  317. return err
  318. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。