You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

main.go 5.6 kB

2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. package main
  2. import (
  3. "fmt"
  4. "net"
  5. "os"
  6. "sync"
  7. log "gitlink.org.cn/cloudream/common/pkgs/logger"
  8. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  9. "gitlink.org.cn/cloudream/storage/agent/internal/config"
  10. "gitlink.org.cn/cloudream/storage/agent/internal/task"
  11. stgglb "gitlink.org.cn/cloudream/storage/common/globals"
  12. "gitlink.org.cn/cloudream/storage/common/pkgs/connectivity"
  13. "gitlink.org.cn/cloudream/storage/common/pkgs/distlock"
  14. "gitlink.org.cn/cloudream/storage/common/pkgs/downloader"
  15. agtrpc "gitlink.org.cn/cloudream/storage/common/pkgs/grpc/agent"
  16. "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch"
  17. // TODO 注册OpUnion,但在mq包中注册会造成循环依赖,所以只能放到这里
  18. _ "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch/ops"
  19. "google.golang.org/grpc"
  20. agtmq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/agent"
  21. coormq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/coordinator"
  22. grpcsvc "gitlink.org.cn/cloudream/storage/agent/internal/grpc"
  23. cmdsvc "gitlink.org.cn/cloudream/storage/agent/internal/mq"
  24. )
// AgentIpList is the list of agent addresses; main assigns it a hard-coded
// value at startup.
// TODO: can this data change at runtime?
var AgentIpList []string
  27. // 主程序入口
  28. func main() {
  29. // TODO: 将Agent的IP列表放到配置文件中读取
  30. AgentIpList = []string{"pcm01", "pcm1", "pcm2"}
  31. // 初始化配置
  32. err := config.Init()
  33. if err != nil {
  34. fmt.Printf("init config failed, err: %s", err.Error())
  35. os.Exit(1)
  36. }
  37. // 初始化日志系统
  38. err = log.Init(&config.Cfg().Logger)
  39. if err != nil {
  40. fmt.Printf("init logger failed, err: %s", err.Error())
  41. os.Exit(1)
  42. }
  43. // 初始化全局变量和连接池
  44. stgglb.InitLocal(&config.Cfg().Local)
  45. stgglb.InitMQPool(&config.Cfg().RabbitMQ)
  46. stgglb.InitAgentRPCPool(&agtrpc.PoolConfig{})
  47. stgglb.InitIPFSPool(&config.Cfg().IPFS)
  48. // 启动网络连通性检测,并进行一次就地检测
  49. conCol := connectivity.NewCollector(&config.Cfg().Connectivity, func(collector *connectivity.Collector) {
  50. log := log.WithField("Connectivity", "")
  51. // 从协调器MQ连接池获取客户端
  52. coorCli, err := stgglb.CoordinatorMQPool.Acquire()
  53. if err != nil {
  54. log.Warnf("acquire coordinator mq failed, err: %s", err.Error())
  55. return
  56. }
  57. // 确保在函数返回前释放客户端
  58. defer stgglb.CoordinatorMQPool.Release(coorCli)
  59. // 处理网络连通性数据,并更新到协调器
  60. cons := collector.GetAll()
  61. nodeCons := make([]cdssdk.NodeConnectivity, 0, len(cons))
  62. for _, con := range cons {
  63. var delay *float32
  64. if con.Delay != nil {
  65. v := float32(con.Delay.Microseconds()) / 1000
  66. delay = &v
  67. }
  68. nodeCons = append(nodeCons, cdssdk.NodeConnectivity{
  69. FromNodeID: *stgglb.Local.NodeID,
  70. ToNodeID: con.ToNodeID,
  71. Delay: delay,
  72. TestTime: con.TestTime,
  73. })
  74. }
  75. _, err = coorCli.UpdateNodeConnectivities(coormq.ReqUpdateNodeConnectivities(nodeCons))
  76. if err != nil {
  77. log.Warnf("update node connectivities: %v", err)
  78. }
  79. })
  80. conCol.CollectInPlace()
  81. // 初始化分布式锁服务
  82. distlock, err := distlock.NewService(&config.Cfg().DistLock)
  83. if err != nil {
  84. log.Fatalf("new ipfs failed, err: %s", err.Error())
  85. }
  86. // 初始化数据切换开关
  87. sw := ioswitch.NewSwitch()
  88. dlder := downloader.NewDownloader(config.Cfg().Downloader)
  89. //处置协调端、客户端命令(可多建几个)
  90. wg := sync.WaitGroup{}
  91. wg.Add(4)
  92. taskMgr := task.NewManager(distlock, &sw, &conCol, &dlder)
  93. // 启动命令服务器
  94. agtSvr, err := agtmq.NewServer(cmdsvc.NewService(&taskMgr, &sw), config.Cfg().ID, &config.Cfg().RabbitMQ)
  95. if err != nil {
  96. log.Fatalf("new agent server failed, err: %s", err.Error())
  97. }
  98. agtSvr.OnError(func(err error) {
  99. log.Warnf("agent server err: %s", err.Error())
  100. })
  101. go serveAgentServer(agtSvr, &wg)
  102. // 启动面向客户端的GRPC服务
  103. listenAddr := config.Cfg().GRPC.MakeListenAddress()
  104. lis, err := net.Listen("tcp", listenAddr)
  105. if err != nil {
  106. log.Fatalf("listen on %s failed, err: %s", listenAddr, err.Error())
  107. }
  108. s := grpc.NewServer()
  109. agtrpc.RegisterAgentServer(s, grpcsvc.NewService(&sw))
  110. go serveGRPC(s, lis, &wg)
  111. // 启动分布式锁服务的处理程序
  112. go serveDistLock(distlock)
  113. // 等待所有服务结束
  114. wg.Wait()
  115. }
  116. // serveAgentServer 启动并服务一个命令服务器
  117. // server: 指向agtmq.Server的指针,代表要被服务的命令服务器
  118. // wg: 指向sync.WaitGroup的指针,用于等待服务器停止
  119. func serveAgentServer(server *agtmq.Server, wg *sync.WaitGroup) {
  120. log.Info("start serving command server")
  121. err := server.Serve()
  122. if err != nil {
  123. log.Errorf("command server stopped with error: %s", err.Error())
  124. }
  125. log.Info("command server stopped")
  126. wg.Done() // 表示服务器已经停止
  127. }
  128. // serveGRPC 启动并服务一个gRPC服务器
  129. // s: 指向grpc.Server的指针,代表要被服务的gRPC服务器
  130. // lis: 网络监听器,用于监听gRPC请求
  131. // wg: 指向sync.WaitGroup的指针,用于等待服务器停止
  132. func serveGRPC(s *grpc.Server, lis net.Listener, wg *sync.WaitGroup) {
  133. log.Info("start serving grpc")
  134. err := s.Serve(lis)
  135. if err != nil {
  136. log.Errorf("grpc stopped with error: %s", err.Error())
  137. }
  138. log.Info("grpc stopped")
  139. wg.Done() // 表示gRPC服务器已经停止
  140. }
  141. // serveDistLock 启动并服务一个分布式锁服务
  142. // svc: 指向distlock.Service的指针,代表要被服务的分布式锁服务
  143. func serveDistLock(svc *distlock.Service) {
  144. log.Info("start serving distlock")
  145. err := svc.Serve()
  146. if err != nil {
  147. log.Errorf("distlock stopped with error: %s", err.Error())
  148. }
  149. log.Info("distlock stopped")
  150. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。