publishers.go 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321
  1. package mq
  2. import (
  3. "encoding/json"
  4. "errors"
  5. "fmt"
  6. "time"
  7. "github.com/gravitl/netmaker/logger"
  8. "github.com/gravitl/netmaker/logic"
  9. "github.com/gravitl/netmaker/logic/metrics"
  10. "github.com/gravitl/netmaker/models"
  11. "github.com/gravitl/netmaker/nm-proxy/manager"
  12. "github.com/gravitl/netmaker/servercfg"
  13. "github.com/gravitl/netmaker/serverctl"
  14. )
  15. // PublishPeerUpdate --- deterines and publishes a peer update to all the peers of a node
  16. func PublishPeerUpdate(newNode *models.Node, publishToSelf bool) error {
  17. if !servercfg.IsMessageQueueBackend() {
  18. return nil
  19. }
  20. networkNodes, err := logic.GetNetworkNodes(newNode.Network)
  21. if err != nil {
  22. logger.Log(1, "err getting Network Nodes", err.Error())
  23. return err
  24. }
  25. for _, node := range networkNodes {
  26. // err := PublishProxyUpdate(manager.AddInterface, &node)
  27. // if err != nil {
  28. // logger.Log(1, "failed to publish proxy update to node", node.Name, "on network", node.Network, ":", err.Error())
  29. // }
  30. if node.IsServer == "yes" {
  31. if servercfg.IsProxyEnabled() {
  32. err := PublishProxyUpdate(manager.AddInterface, &node)
  33. if err != nil {
  34. logger.Log(0, "failed to send proxy update for server: ", err.Error())
  35. }
  36. }
  37. continue
  38. }
  39. if !publishToSelf && newNode.ID == node.ID {
  40. //skip self
  41. continue
  42. }
  43. err = PublishSinglePeerUpdate(&node)
  44. if err != nil {
  45. logger.Log(1, "failed to publish peer update to node", node.Name, "on network", node.Network, ":", err.Error())
  46. }
  47. }
  48. return err
  49. }
  50. func PublishProxyUpdate(action manager.ProxyAction, node *models.Node) error {
  51. peerUpdates, err := logic.GetPeersForProxy(node, false)
  52. if err != nil {
  53. return err
  54. }
  55. err = ProxyUpdate(&manager.ManagerAction{
  56. Action: action,
  57. Payload: peerUpdates}, node)
  58. if err != nil {
  59. logger.Log(1, "failed to send proxy update: ", err.Error())
  60. return err
  61. }
  62. return nil
  63. }
  64. // PublishSinglePeerUpdate --- determines and publishes a peer update to one node
  65. func PublishSinglePeerUpdate(node *models.Node) error {
  66. peerUpdate, err := logic.GetPeerUpdate(node)
  67. if err != nil {
  68. return err
  69. }
  70. if node.Proxy {
  71. proxyUpdate, err := logic.GetPeersForProxy(node, false)
  72. if err != nil {
  73. return err
  74. }
  75. peerUpdate.ProxyUpdate = manager.ManagerAction{
  76. Action: manager.AddInterface,
  77. Payload: proxyUpdate,
  78. }
  79. }
  80. data, err := json.Marshal(&peerUpdate)
  81. if err != nil {
  82. return err
  83. }
  84. return publish(node, fmt.Sprintf("peers/%s/%s", node.Network, node.ID), data)
  85. }
  86. // PublishPeerUpdate --- publishes a peer update to all the peers of a node
  87. func PublishExtPeerUpdate(node *models.Node) error {
  88. var err error
  89. if logic.IsLocalServer(node) {
  90. if err = logic.ServerUpdate(node, false); err != nil {
  91. logger.Log(1, "server node:", node.ID, "failed to update peers with ext clients")
  92. return err
  93. } else {
  94. return nil
  95. }
  96. }
  97. if !servercfg.IsMessageQueueBackend() {
  98. return nil
  99. }
  100. peerUpdate, err := logic.GetPeerUpdate(node)
  101. if err != nil {
  102. return err
  103. }
  104. data, err := json.Marshal(&peerUpdate)
  105. if err != nil {
  106. return err
  107. }
  108. if err = publish(node, fmt.Sprintf("peers/%s/%s", node.Network, node.ID), data); err != nil {
  109. return err
  110. }
  111. go PublishPeerUpdate(node, false)
  112. return nil
  113. }
  114. // NodeUpdate -- publishes a node update
  115. func NodeUpdate(node *models.Node) error {
  116. var err error
  117. if !servercfg.IsMessageQueueBackend() || node.IsServer == "yes" {
  118. return nil
  119. }
  120. logger.Log(3, "publishing node update to "+node.Name)
  121. if len(node.NetworkSettings.AccessKeys) > 0 {
  122. node.NetworkSettings.AccessKeys = []models.AccessKey{} // not to be sent (don't need to spread access keys around the network; we need to know how to reach other nodes, not become them)
  123. }
  124. if node.Proxy {
  125. err = PublishProxyUpdate(manager.AddInterface, node)
  126. if err != nil {
  127. logger.Log(1, "failed to publish proxy update to node", node.Name, "on network", node.Network, ":", err.Error())
  128. }
  129. } else {
  130. data, err := json.Marshal(node)
  131. if err != nil {
  132. logger.Log(2, "error marshalling node update ", err.Error())
  133. return err
  134. }
  135. if err = publish(node, fmt.Sprintf("update/%s/%s", node.Network, node.ID), data); err != nil {
  136. logger.Log(2, "error publishing node update to peer ", node.ID, err.Error())
  137. return err
  138. }
  139. }
  140. return nil
  141. }
  142. //ProxyUpdate -- publishes updates to peers related to proxy
  143. func ProxyUpdate(proxyPayload *manager.ManagerAction, node *models.Node) error {
  144. if !servercfg.IsMessageQueueBackend() {
  145. return nil
  146. }
  147. if node.IsServer == "yes" {
  148. logic.ProxyMgmChan <- proxyPayload
  149. }
  150. logger.Log(3, "publishing proxy update to "+node.Name)
  151. data, err := json.Marshal(proxyPayload)
  152. if err != nil {
  153. logger.Log(2, "error marshalling node update ", err.Error())
  154. return err
  155. }
  156. if err = publish(node, fmt.Sprintf("proxy/%s/%s", node.Network, node.ID), data); err != nil {
  157. logger.Log(2, "error publishing proxy update to peer ", node.ID, err.Error())
  158. return err
  159. }
  160. return nil
  161. }
  162. // sendPeers - retrieve networks, send peer ports to all peers
  163. func sendPeers() {
  164. networks, err := logic.GetNetworks()
  165. if err != nil {
  166. logger.Log(1, "error retrieving networks for keepalive", err.Error())
  167. }
  168. var force bool
  169. peer_force_send++
  170. if peer_force_send == 5 {
  171. // run iptables update to ensure gateways work correctly and mq is forwarded if containerized
  172. if servercfg.ManageIPTables() != "off" {
  173. serverctl.InitIPTables(false)
  174. }
  175. servercfg.SetHost()
  176. force = true
  177. peer_force_send = 0
  178. err := logic.TimerCheckpoint() // run telemetry & log dumps if 24 hours has passed..
  179. if err != nil {
  180. logger.Log(3, "error occurred on timer,", err.Error())
  181. }
  182. collectServerMetrics(networks[:])
  183. }
  184. for _, network := range networks {
  185. serverNode, errN := logic.GetNetworkServerLocal(network.NetID)
  186. if errN == nil {
  187. serverNode.SetLastCheckIn()
  188. if err := logic.UpdateNode(&serverNode, &serverNode); err != nil {
  189. logger.Log(0, "failed checkin for server node", serverNode.Name, "on network", network.NetID, err.Error())
  190. }
  191. }
  192. isLeader := logic.IsLeader(&serverNode)
  193. if errN == nil && isLeader {
  194. if network.DefaultUDPHolePunch == "yes" {
  195. if logic.ShouldPublishPeerPorts(&serverNode) || force {
  196. if force {
  197. logger.Log(2, "sending scheduled peer update (5 min)")
  198. }
  199. err = PublishPeerUpdate(&serverNode, false)
  200. if err != nil {
  201. logger.Log(1, "error publishing udp port updates for network", network.NetID)
  202. logger.Log(1, errN.Error())
  203. }
  204. }
  205. }
  206. } else {
  207. if isLeader {
  208. logger.Log(1, "unable to retrieve leader for network ", network.NetID)
  209. }
  210. logger.Log(2, "server checkin complete for server", serverNode.Name, "on network", network.NetID)
  211. serverctl.SyncServerNetwork(network.NetID)
  212. if errN != nil {
  213. logger.Log(1, errN.Error())
  214. }
  215. if servercfg.IsProxyEnabled() {
  216. serverctl.SyncServerNetworkWithProxy()
  217. }
  218. }
  219. }
  220. }
  221. // ServerStartNotify - notifies all non server nodes to pull changes after a restart
  222. func ServerStartNotify() error {
  223. nodes, err := logic.GetAllNodes()
  224. if err != nil {
  225. return err
  226. }
  227. for i := range nodes {
  228. nodes[i].Action = models.NODE_FORCE_UPDATE
  229. if err = NodeUpdate(&nodes[i]); err != nil {
  230. logger.Log(1, "error when notifying node", nodes[i].Name, " - ", nodes[i].ID, "of a server startup")
  231. }
  232. }
  233. return nil
  234. }
  235. // function to collect and store metrics for server nodes
  236. func collectServerMetrics(networks []models.Network) {
  237. if !servercfg.Is_EE {
  238. return
  239. }
  240. if len(networks) > 0 {
  241. for i := range networks {
  242. currentNetworkNodes, err := logic.GetNetworkNodes(networks[i].NetID)
  243. if err != nil {
  244. continue
  245. }
  246. currentServerNodes := logic.GetServerNodes(networks[i].NetID)
  247. if len(currentServerNodes) > 0 {
  248. for i := range currentServerNodes {
  249. if logic.IsLocalServer(&currentServerNodes[i]) {
  250. serverMetrics := logic.CollectServerMetrics(currentServerNodes[i].ID, currentNetworkNodes)
  251. if serverMetrics != nil {
  252. serverMetrics.NodeName = currentServerNodes[i].Name
  253. serverMetrics.NodeID = currentServerNodes[i].ID
  254. serverMetrics.IsServer = "yes"
  255. serverMetrics.Network = currentServerNodes[i].Network
  256. if err = metrics.GetExchangedBytesForNode(&currentServerNodes[i], serverMetrics); err != nil {
  257. logger.Log(1, fmt.Sprintf("failed to update exchanged bytes info for server: %s, err: %v",
  258. currentServerNodes[i].Name, err))
  259. }
  260. updateNodeMetrics(&currentServerNodes[i], serverMetrics)
  261. if err = logic.UpdateMetrics(currentServerNodes[i].ID, serverMetrics); err != nil {
  262. logger.Log(1, "failed to update metrics for server node", currentServerNodes[i].ID)
  263. }
  264. if servercfg.IsMetricsExporter() {
  265. logger.Log(2, "-------------> SERVER METRICS: ", fmt.Sprintf("%+v", serverMetrics))
  266. if err := pushMetricsToExporter(*serverMetrics); err != nil {
  267. logger.Log(2, "failed to push server metrics to exporter: ", err.Error())
  268. }
  269. }
  270. }
  271. }
  272. }
  273. }
  274. }
  275. }
  276. }
  277. func pushMetricsToExporter(metrics models.Metrics) error {
  278. logger.Log(2, "----> Pushing metrics to exporter")
  279. data, err := json.Marshal(metrics)
  280. if err != nil {
  281. return errors.New("failed to marshal metrics: " + err.Error())
  282. }
  283. if token := mqclient.Publish("metrics_exporter", 2, true, data); !token.WaitTimeout(MQ_TIMEOUT*time.Second) || token.Error() != nil {
  284. var err error
  285. if token.Error() == nil {
  286. err = errors.New("connection timeout")
  287. } else {
  288. err = token.Error()
  289. }
  290. return err
  291. }
  292. return nil
  293. }