mq.go 7.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233
  1. package mq
  2. import (
  3. "context"
  4. "encoding/json"
  5. "errors"
  6. "fmt"
  7. "log"
  8. "strings"
  9. "time"
  10. mqtt "github.com/eclipse/paho.mqtt.golang"
  11. "github.com/gravitl/netmaker/database"
  12. "github.com/gravitl/netmaker/logger"
  13. "github.com/gravitl/netmaker/logic"
  14. "github.com/gravitl/netmaker/models"
  15. "github.com/gravitl/netmaker/servercfg"
  16. "github.com/gravitl/netmaker/serverctl"
  17. )
  18. const KEEPALIVE_TIMEOUT = 60 //timeout in seconds
  19. const MQ_DISCONNECT = 250
  20. // DefaultHandler default message queue handler - only called when GetDebug == true
  21. var DefaultHandler mqtt.MessageHandler = func(client mqtt.Client, msg mqtt.Message) {
  22. logger.Log(0, "MQTT Message: Topic: ", string(msg.Topic()), " Message: ", string(msg.Payload()))
  23. }
  24. // Ping message Handler -- handles ping topic from client nodes
  25. var Ping mqtt.MessageHandler = func(client mqtt.Client, msg mqtt.Message) {
  26. logger.Log(0, "Ping Handler: ", msg.Topic())
  27. go func() {
  28. id, err := GetID(msg.Topic())
  29. if err != nil {
  30. logger.Log(0, "error getting node.ID sent on ping topic ")
  31. return
  32. }
  33. node, err := logic.GetNodeByID(id)
  34. if err != nil {
  35. logger.Log(0, "mq-ping error getting node: ", err.Error())
  36. record, err := database.FetchRecord(database.NODES_TABLE_NAME, id)
  37. if err != nil {
  38. logger.Log(0, "error reading database ", err.Error())
  39. return
  40. }
  41. logger.Log(0, "record from database")
  42. logger.Log(0, record)
  43. return
  44. }
  45. _, decryptErr := decryptMsg(&node, msg.Payload())
  46. if decryptErr != nil {
  47. logger.Log(0, "error updating node ", node.ID, err.Error())
  48. return
  49. }
  50. node.SetLastCheckIn()
  51. if err := logic.UpdateNode(&node, &node); err != nil {
  52. logger.Log(0, "error updating node ", err.Error())
  53. }
  54. logger.Log(3, "ping processed for node", node.ID)
  55. // --TODO --set client version once feature is implemented.
  56. //node.SetClientVersion(msg.Payload())
  57. }()
  58. }
  59. // UpdateNode message Handler -- handles updates from client nodes
  60. var UpdateNode mqtt.MessageHandler = func(client mqtt.Client, msg mqtt.Message) {
  61. go func() {
  62. id, err := GetID(msg.Topic())
  63. if err != nil {
  64. logger.Log(1, "error getting node.ID sent on ", msg.Topic(), err.Error())
  65. return
  66. }
  67. currentNode, err := logic.GetNodeByID(id)
  68. if err != nil {
  69. logger.Log(1, "error getting node ", id, err.Error())
  70. return
  71. }
  72. decrypted, decryptErr := decryptMsg(&currentNode, msg.Payload())
  73. if decryptErr != nil {
  74. logger.Log(1, "failed to decrypt message for node ", id, decryptErr.Error())
  75. return
  76. }
  77. logger.Log(1, "Update Node Handler", id)
  78. var newNode models.Node
  79. if err := json.Unmarshal(decrypted, &newNode); err != nil {
  80. logger.Log(1, "error unmarshaling payload ", err.Error())
  81. return
  82. }
  83. if err := logic.UpdateNode(&currentNode, &newNode); err != nil {
  84. logger.Log(1, "error saving node", err.Error())
  85. }
  86. if err := PublishPeerUpdate(&newNode); err != nil {
  87. logger.Log(1, "error publishing peer update ", err.Error())
  88. return
  89. }
  90. logger.Log(1, "no need to update peers")
  91. }()
  92. }
  93. // PublishPeerUpdate --- deterines and publishes a peer update to all the peers of a node
  94. func PublishPeerUpdate(newNode *models.Node) error {
  95. networkNodes, err := logic.GetNetworkNodes(newNode.Network)
  96. if err != nil {
  97. logger.Log(1, "err getting Network Nodes", err.Error())
  98. return err
  99. }
  100. for _, node := range networkNodes {
  101. if node.IsServer == "yes" || node.ID == newNode.ID {
  102. log.Println("skipping update on " + node.Name + " : " + node.ID)
  103. continue
  104. }
  105. log.Println("running update on " + node.Name + " : " + node.ID)
  106. peerUpdate, err := logic.GetPeerUpdate(&node)
  107. if err != nil {
  108. logger.Log(1, "error getting peer update for node", node.ID, err.Error())
  109. continue
  110. }
  111. data, err := json.Marshal(&peerUpdate)
  112. if err != nil {
  113. logger.Log(2, "error marshaling peer update for node", node.ID, err.Error())
  114. continue
  115. }
  116. if err = publish(&node, fmt.Sprintf("peers/%s/%s", node.Network, node.ID), data); err != nil {
  117. logger.Log(1, "failed to publish peer update for node", node.ID)
  118. } else {
  119. logger.Log(1, fmt.Sprintf("sent peer update for node %s on network: %s ", node.Name, node.Network))
  120. }
  121. }
  122. return nil
  123. }
  124. // GetID -- decodes a message queue topic and returns the embedded node.ID
  125. func GetID(topic string) (string, error) {
  126. parts := strings.Split(topic, "/")
  127. count := len(parts)
  128. if count == 1 {
  129. return "", errors.New("invalid topic")
  130. }
  131. //the last part of the topic will be the node.ID
  132. return parts[count-1], nil
  133. }
  134. // NodeUpdate -- publishes a node update
  135. func NodeUpdate(node *models.Node) error {
  136. if !servercfg.IsMessageQueueBackend() {
  137. return nil
  138. }
  139. logger.Log(3, "publishing node update to "+node.Name)
  140. data, err := json.Marshal(node)
  141. if err != nil {
  142. logger.Log(2, "error marshalling node update ", err.Error())
  143. return err
  144. }
  145. if err = publish(node, fmt.Sprintf("update/%s/%s", node.Network, node.ID), data); err != nil {
  146. logger.Log(2, "error publishing node update to peer ", node.ID, err.Error())
  147. return err
  148. }
  149. return nil
  150. }
  151. // SetupMQTT creates a connection to broker and return client
  152. func SetupMQTT() mqtt.Client {
  153. opts := mqtt.NewClientOptions()
  154. broker := servercfg.GetMessageQueueEndpoint()
  155. opts.AddBroker(broker)
  156. client := mqtt.NewClient(opts)
  157. tperiod := time.Now().Add(10 * time.Second)
  158. for {
  159. if token := client.Connect(); token.Wait() && token.Error() != nil {
  160. logger.Log(2, "unable to connect to broker, retrying ...")
  161. if time.Now().After(tperiod) {
  162. log.Fatal(0, "could not connect to broker, exiting ...", token.Error())
  163. }
  164. } else {
  165. break
  166. }
  167. time.Sleep(2 * time.Second)
  168. }
  169. logger.Log(2, "connected to message queue", broker)
  170. return client
  171. }
  172. // Keepalive -- periodically pings all nodes to let them know server is still alive and doing well
  173. func Keepalive(ctx context.Context) {
  174. for {
  175. select {
  176. case <-ctx.Done():
  177. return
  178. case <-time.After(time.Second * KEEPALIVE_TIMEOUT):
  179. client := SetupMQTT()
  180. networks, err := logic.GetNetworks()
  181. if err != nil {
  182. logger.Log(1, "error retrieving networks for keepalive", err.Error())
  183. }
  184. for _, network := range networks {
  185. var id string
  186. for _, servAddr := range network.DefaultServerAddrs {
  187. if servAddr.IsLeader {
  188. id = servAddr.ID
  189. }
  190. }
  191. serverNode, errN := logic.GetNodeByID(id)
  192. if errN == nil {
  193. serverNode.SetLastCheckIn()
  194. logic.UpdateNode(&serverNode, &serverNode)
  195. if network.DefaultUDPHolePunch == "yes" {
  196. logic.ShouldPublishPeerPorts(&serverNode)
  197. }
  198. err = PublishPeerUpdate(&serverNode)
  199. if err != nil {
  200. logger.Log(1, "error publishing udp port updates", err.Error())
  201. }
  202. }
  203. if id == "" {
  204. logger.Log(0, "leader not defined for network", network.NetID)
  205. continue
  206. }
  207. if token := client.Publish("serverkeepalive/"+id, 0, false, servercfg.GetVersion()); token.Wait() && token.Error() != nil {
  208. logger.Log(1, "error publishing server keepalive for network", network.NetID, token.Error().Error())
  209. } else {
  210. logger.Log(2, "keepalive sent for network", network.NetID)
  211. }
  212. err = serverctl.SyncServerNetwork(network.NetID)
  213. if err != nil {
  214. logger.Log(1, "error syncing server network", err.Error())
  215. }
  216. }
  217. client.Disconnect(MQ_DISCONNECT)
  218. }
  219. }
  220. }