You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

main.go 5.4 kB

2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189
  1. package main
  2. import (
  3. "fmt"
  4. "net"
  5. "os"
  6. "sync"
  7. log "gitlink.org.cn/cloudream/common/pkgs/logger"
  8. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  9. "gitlink.org.cn/cloudream/storage/agent/internal/config"
  10. "gitlink.org.cn/cloudream/storage/agent/internal/task"
  11. stgglb "gitlink.org.cn/cloudream/storage/common/globals"
  12. "gitlink.org.cn/cloudream/storage/common/pkgs/connectivity"
  13. "gitlink.org.cn/cloudream/storage/common/pkgs/distlock"
  14. agtrpc "gitlink.org.cn/cloudream/storage/common/pkgs/grpc/agent"
  15. "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch"
  16. // TODO 注册OpUnion,但在mq包中注册会造成循环依赖,所以只能放到这里
  17. _ "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch/ops"
  18. "google.golang.org/grpc"
  19. agtmq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/agent"
  20. coormq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/coordinator"
  21. grpcsvc "gitlink.org.cn/cloudream/storage/agent/internal/grpc"
  22. cmdsvc "gitlink.org.cn/cloudream/storage/agent/internal/mq"
  23. )
  24. // TODO 此数据是否在运行时会发生变化?
  25. var AgentIpList []string
  26. // 主程序入口
  27. func main() {
  28. // TODO: 将Agent的IP列表放到配置文件中读取
  29. AgentIpList = []string{"pcm01", "pcm1", "pcm2"}
  30. // 初始化配置
  31. err := config.Init()
  32. if err != nil {
  33. fmt.Printf("init config failed, err: %s", err.Error())
  34. os.Exit(1)
  35. }
  36. // 初始化日志系统
  37. err = log.Init(&config.Cfg().Logger)
  38. if err != nil {
  39. fmt.Printf("init logger failed, err: %s", err.Error())
  40. os.Exit(1)
  41. }
  42. // 初始化全局变量和连接池
  43. stgglb.InitLocal(&config.Cfg().Local)
  44. stgglb.InitMQPool(&config.Cfg().RabbitMQ)
  45. stgglb.InitAgentRPCPool(&agtrpc.PoolConfig{})
  46. stgglb.InitIPFSPool(&config.Cfg().IPFS)
  47. // 启动网络连通性检测,并进行一次就地检测
  48. conCol := connectivity.NewCollector(&config.Cfg().Connectivity, func(collector *connectivity.Collector) {
  49. log := log.WithField("Connectivity", "")
  50. // 从协调器MQ连接池获取客户端
  51. coorCli, err := stgglb.CoordinatorMQPool.Acquire()
  52. if err != nil {
  53. log.Warnf("acquire coordinator mq failed, err: %s", err.Error())
  54. return
  55. }
  56. // 确保在函数返回前释放客户端
  57. defer stgglb.CoordinatorMQPool.Release(coorCli)
  58. // 处理网络连通性数据,并更新到协调器
  59. cons := collector.GetAll()
  60. nodeCons := make([]cdssdk.NodeConnectivity, 0, len(cons))
  61. for _, con := range cons {
  62. var delay *float32
  63. if con.Delay != nil {
  64. v := float32(con.Delay.Microseconds()) / 1000
  65. delay = &v
  66. }
  67. nodeCons = append(nodeCons, cdssdk.NodeConnectivity{
  68. FromNodeID: *stgglb.Local.NodeID,
  69. ToNodeID: con.ToNodeID,
  70. Delay: delay,
  71. TestTime: con.TestTime,
  72. })
  73. }
  74. _, err = coorCli.UpdateNodeConnectivities(coormq.ReqUpdateNodeConnectivities(nodeCons))
  75. if err != nil {
  76. log.Warnf("update node connectivities: %v", err)
  77. }
  78. })
  79. conCol.CollectInPlace()
  80. // 初始化分布式锁服务
  81. distlock, err := distlock.NewService(&config.Cfg().DistLock)
  82. if err != nil {
  83. log.Fatalf("new ipfs failed, err: %s", err.Error())
  84. }
  85. // 初始化数据切换开关
  86. sw := ioswitch.NewSwitch()
  87. // 启动任务管理器和相关服务
  88. wg := sync.WaitGroup{}
  89. wg.Add(4)
  90. taskMgr := task.NewManager(distlock, &sw, &conCol)
  91. // 启动命令服务器
  92. agtSvr, err := agtmq.NewServer(cmdsvc.NewService(&taskMgr, &sw), config.Cfg().ID, &config.Cfg().RabbitMQ)
  93. if err != nil {
  94. log.Fatalf("new agent server failed, err: %s", err.Error())
  95. }
  96. agtSvr.OnError(func(err error) {
  97. log.Warnf("agent server err: %s", err.Error())
  98. })
  99. go serveAgentServer(agtSvr, &wg)
  100. // 启动面向客户端的GRPC服务
  101. listenAddr := config.Cfg().GRPC.MakeListenAddress()
  102. lis, err := net.Listen("tcp", listenAddr)
  103. if err != nil {
  104. log.Fatalf("listen on %s failed, err: %s", listenAddr, err.Error())
  105. }
  106. s := grpc.NewServer()
  107. agtrpc.RegisterAgentServer(s, grpcsvc.NewService(&sw))
  108. go serveGRPC(s, lis, &wg)
  109. // 启动分布式锁服务的处理程序
  110. go serveDistLock(distlock)
  111. // 等待所有服务结束
  112. wg.Wait()
  113. }
  114. // serveAgentServer 启动并服务一个命令服务器
  115. // server: 指向agtmq.Server的指针,代表要被服务的命令服务器
  116. // wg: 指向sync.WaitGroup的指针,用于等待服务器停止
  117. func serveAgentServer(server *agtmq.Server, wg *sync.WaitGroup) {
  118. log.Info("start serving command server")
  119. err := server.Serve()
  120. if err != nil {
  121. log.Errorf("command server stopped with error: %s", err.Error())
  122. }
  123. log.Info("command server stopped")
  124. wg.Done() // 表示服务器已经停止
  125. }
  126. // serveGRPC 启动并服务一个gRPC服务器
  127. // s: 指向grpc.Server的指针,代表要被服务的gRPC服务器
  128. // lis: 网络监听器,用于监听gRPC请求
  129. // wg: 指向sync.WaitGroup的指针,用于等待服务器停止
  130. func serveGRPC(s *grpc.Server, lis net.Listener, wg *sync.WaitGroup) {
  131. log.Info("start serving grpc")
  132. err := s.Serve(lis)
  133. if err != nil {
  134. log.Errorf("grpc stopped with error: %s", err.Error())
  135. }
  136. log.Info("grpc stopped")
  137. wg.Done() // 表示gRPC服务器已经停止
  138. }
  139. // serveDistLock 启动并服务一个分布式锁服务
  140. // svc: 指向distlock.Service的指针,代表要被服务的分布式锁服务
  141. func serveDistLock(svc *distlock.Service) {
  142. log.Info("start serving distlock")
  143. err := svc.Serve()
  144. if err != nil {
  145. log.Errorf("distlock stopped with error: %s", err.Error())
  146. }
  147. log.Info("distlock stopped")
  148. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。