main.go 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182
  1. package main
  2. import (
  3. commonConfig "cicv-data-closedloop/aarch64/pjibot_guide/common/config"
  4. commonService "cicv-data-closedloop/aarch64/pjibot_guide/common/service"
  5. "cicv-data-closedloop/aarch64/pjibot_guide/common/variable"
  6. "cicv-data-closedloop/aarch64/pjibot_guide/control/pkg"
  7. "cicv-data-closedloop/common/config/c_log"
  8. "cicv-data-closedloop/common/entity"
  9. "cicv-data-closedloop/common/util"
  10. "fmt"
  11. "net/rpc"
  12. "os"
  13. "runtime"
  14. "time"
  15. )
  // Package-level state shared by main, the renewal goroutine and the
  // start/stop helpers in this file.
  var (
  	// applicationName is the name handed to c_log.InitLog in init.
  	applicationName = "pji-control"

  	// Current and previously observed states. The cloud pair is passed by
  	// pointer to pkg.GetCloudStatus and pkg.GetCloudConfig from main.
  	localStatus     = "idle"
  	lastLocalStatus = "idle"
  	cloudStatus     = "NONE"
  	lastCloudStatus = "NONE"

  	// Intervals and limits. These are plain ints; the unit is applied at
  	// the point of use.
  	localTurnLength = 1  // seconds: local status refresh interval
  	cloudTurnLength = 60 // seconds: cloud status refresh interval
  	renewTurnLength = 3  // seconds: renewal check interval
  	waitStopLength  = 1  // minutes: wait before stopping the master
  	RenewDur        = 5  // minutes: length of one renewal window
  	maxRetryCount   = 10 // maximum retries when querying the config

  	// launchedFlag is set by startMasterNode and cleared by stopMasterNode.
  	launchedFlag = false
  	// renewedFlag is true while a renewal window is open; the renewTimer
  	// callback sets it back to false.
  	renewedFlag = false
  	// renewTimer is the timer that closes the current renewal window.
  	renewTimer *time.Timer
  )
  32. func init() {
  33. runtime.GOMAXPROCS(1)
  34. // 初始化日志配置
  35. c_log.InitLog(variable.LogDir, applicationName)
  36. // 初始化本地配置文件(第1处配置,在本地文件)
  37. commonConfig.InitLocalConfig(variable.LocalConfigPath)
  38. // 初始化Oss连接信息
  39. commonConfig.InitOssConfig()
  40. // 初始化业务逻辑配置信息,配置文件在oss上(第2处配置,在oss文件)
  41. commonConfig.InitCloudConfig()
  42. // 初始化rpc客户端,用于杀死旧的采集程序
  43. // 初始化websocket配置
  44. commonConfig.InitWebsocketConfig()
  45. }
  46. func initRenew() {
  47. c_log.GlobalLogger.Info("启动定时器 - 开始。")
  48. if renewTimer != nil {
  49. renewTimer.Stop()
  50. }
  51. renewedFlag = true
  52. renewTimer = time.AfterFunc(time.Duration(RenewDur)*time.Minute, func() {
  53. renewedFlag = false
  54. })
  55. c_log.GlobalLogger.Infof("定时时间【%v】分钟 - 成功。", RenewDur)
  56. }
  57. func renew() {
  58. for {
  59. time.Sleep(time.Duration(renewTurnLength) * time.Second)
  60. if localStatus == "running" && launchedFlag && !renewedFlag { // 设备处于运行状态,数采程序已启动,且尚未续约
  61. c_log.GlobalLogger.Info("设备仍处于运行状态,续约 - 开始。")
  62. if renewTimer != nil {
  63. renewTimer.Stop()
  64. }
  65. renewedFlag = true
  66. renewTimer = time.AfterFunc(time.Duration(RenewDur)*time.Minute, func() {
  67. renewedFlag = false
  68. })
  69. c_log.GlobalLogger.Infof("续约时间【%v】分钟 - 成功。", RenewDur)
  70. }
  71. }
  72. }
  73. func startMasterNode() {
  74. c_log.GlobalLogger.Info("获取数据闭环平台最新配置。")
  75. if commonConfig.CheckPlatformConfigStatus(maxRetryCount) {
  76. c_log.GlobalLogger.Info("查询到数据闭环平台有配置任务。")
  77. commonConfig.InitPlatformConfig()
  78. if _, err := util.ExecuteWithPath(commonConfig.LocalConfig.RestartCmd.Dir, commonConfig.LocalConfig.RestartCmd.Name, commonConfig.LocalConfig.RestartCmd.Args...); err != nil {
  79. c_log.GlobalLogger.Info("启动新程序失败,【path】=", commonConfig.LocalConfig.RestartCmd.Dir, "【cmd】=", commonConfig.LocalConfig.RestartCmd.Name, commonConfig.LocalConfig.RestartCmd.Args, ":", err)
  80. os.Exit(-1)
  81. }
  82. c_log.GlobalLogger.Info("启动任务,本地执行启动命令:【path】=", commonConfig.LocalConfig.RestartCmd.Dir, "【cmd】=", commonConfig.LocalConfig.RestartCmd.Name, commonConfig.LocalConfig.RestartCmd.Args)
  83. initRenew()
  84. launchedFlag = true
  85. c_log.GlobalLogger.Info("数采程序启动 - 成功。")
  86. } else {
  87. c_log.GlobalLogger.Error("查询到数据闭环平台没有配置任务,不启动数采程序。")
  88. }
  89. }
  90. func stopMasterNode() {
  91. // 发送rpc信号杀死采集程序
  92. var killArgs commonService.KillSignal
  93. killArgs = commonService.KillSignal{NodeName: "master", DropUploadData: commonConfig.PlatformConfig.DropUploadData, Restart: false}
  94. c_log.GlobalLogger.Info("杀死任务,发送rpc结束信号:", killArgs)
  95. KillRpcClient, err := rpc.Dial("tcp", commonConfig.LocalConfig.Node.Ip+":"+commonConfig.CloudConfig.RpcPort)
  96. if err != nil {
  97. // 此处如果连接失败说明采集程序已经停止了
  98. lastCloudStatus = "NONE"
  99. c_log.GlobalLogger.Error("采集程序已经停止:", err)
  100. return
  101. }
  102. reply := 0
  103. if err = KillRpcClient.Call("KillService.Kill", killArgs, &reply); err != nil {
  104. c_log.GlobalLogger.Error("发送 rpc 请求到 master 报错:", err)
  105. }
  106. c_log.GlobalLogger.Info("结束任务后,将数据闭环平台配置置空。")
  107. commonConfig.PlatformConfig = commonConfig.PlatformConfigStruct{}
  108. if err = KillRpcClient.Close(); err != nil {
  109. // 不做处理
  110. }
  111. launchedFlag = false
  112. c_log.GlobalLogger.Info("数采程序关闭 - 成功。")
  113. }
  114. func main() {
  115. // 更新本地任务状态
  116. //go pkg.GetLocalStatus(&localStatus, &lastLocalStatus, localTurnLength)
  117. // 更新云端任务状态
  118. go pkg.GetCloudStatus(&cloudStatus, &lastCloudStatus, cloudTurnLength)
  119. // 定期检查本地任务状态,执行续约,避免短时间内多次启停
  120. go renew()
  121. // 云端任务状态负责更新配置
  122. go pkg.GetCloudConfig(&cloudStatus, &lastCloudStatus, cloudTurnLength)
  123. for {
  124. if launchedFlag { // 当前已启动master节点
  125. time.Sleep(time.Duration(cloudTurnLength) * time.Second)
  126. } else {
  127. time.Sleep(time.Duration(localTurnLength) * time.Second)
  128. }
  129. fmt.Println("localStatus: ", localStatus, "lastLocalStatus: ", lastLocalStatus)
  130. fmt.Println("cloudStatus: ", cloudStatus, "lastCloudStatus: ", lastCloudStatus)
  131. // 综合判断 cloudStatus 和 localStatus
  132. // cloudStatus
  133. // UN_CHANGE 没有新的任务,无需更改
  134. // CHANGE 有新的任务,需要杀死旧的数采任务并重启
  135. // NONE 设备没有配置任务,需要杀死旧的数采任务
  136. // localStatus
  137. // idle 空闲状态,此状态下不启动数采任务
  138. // running 繁忙状态,此状态需要启动数采任务
  139. // error 错误状态,此状态下不启动数采任务
  140. // 本地任务状态负责启停master
  141. if localStatus == "running" {
  142. if !launchedFlag { // 目前未启动数采程序
  143. c_log.GlobalLogger.Info("数采程序启动 - 开始。")
  144. startMasterNode()
  145. }
  146. } else if localStatus == "idle" {
  147. if !renewedFlag && launchedFlag && len(entity.TimeWindowConsumerQueue) == 0 {
  148. time.Sleep(time.Duration(waitStopLength) * time.Minute)
  149. c_log.GlobalLogger.Info("设备不在运行状态且没有待处理的数据,数采程序关闭 - 开始。")
  150. stopMasterNode()
  151. }
  152. } else if localStatus == "error" {
  153. c_log.GlobalLogger.Error("设备运行状态出错,停止数采程序。")
  154. stopMasterNode()
  155. } else {
  156. c_log.GlobalLogger.Error("未知的设备运行状态。【status】=", localStatus)
  157. }
  158. }
  159. }