mq.go 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302
  1. package mq
  2. import (
  3. "context"
  4. "encoding/json"
  5. "errors"
  6. "fmt"
  7. "log"
  8. "strings"
  9. "time"
  10. mqtt "github.com/eclipse/paho.mqtt.golang"
  11. "github.com/gravitl/netmaker/database"
  12. "github.com/gravitl/netmaker/logger"
  13. "github.com/gravitl/netmaker/logic"
  14. "github.com/gravitl/netmaker/models"
  15. "github.com/gravitl/netmaker/netclient/ncutils"
  16. "github.com/gravitl/netmaker/servercfg"
  17. )
  const (
  	// KEEPALIVE_TIMEOUT - number of seconds Keepalive waits between calls to sendPeers
  	KEEPALIVE_TIMEOUT = 60

  	// MQ_DISCONNECT - disconnects MQ
  	// NOTE(review): presumably the quiesce time in milliseconds for a client
  	// Disconnect call; it is not referenced in this part of the file -- confirm.
  	MQ_DISCONNECT = 250
  )

  // peer_force_send - counts sendPeers invocations; sendPeers resets it to zero
  // on every fifth call, which is when a peer update is forced.
  var peer_force_send int
  23. // DefaultHandler default message queue handler - only called when GetDebug == true
  24. func DefaultHandler(client mqtt.Client, msg mqtt.Message) {
  25. logger.Log(0, "MQTT Message: Topic: ", string(msg.Topic()), " Message: ", string(msg.Payload()))
  26. }
  27. // Ping message Handler -- handles ping topic from client nodes
  28. func Ping(client mqtt.Client, msg mqtt.Message) {
  29. logger.Log(0, "Ping Handler: ", msg.Topic())
  30. go func() {
  31. id, err := GetID(msg.Topic())
  32. if err != nil {
  33. logger.Log(0, "error getting node.ID sent on ping topic ")
  34. return
  35. }
  36. node, err := logic.GetNodeByID(id)
  37. if err != nil {
  38. logger.Log(0, "mq-ping error getting node: ", err.Error())
  39. record, err := database.FetchRecord(database.NODES_TABLE_NAME, id)
  40. if err != nil {
  41. logger.Log(0, "error reading database ", err.Error())
  42. return
  43. }
  44. logger.Log(0, "record from database")
  45. logger.Log(0, record)
  46. return
  47. }
  48. _, decryptErr := decryptMsg(&node, msg.Payload())
  49. if decryptErr != nil {
  50. logger.Log(0, "error decrypting when updating node ", node.ID, decryptErr.Error())
  51. return
  52. }
  53. node.SetLastCheckIn()
  54. if err := logic.UpdateNode(&node, &node); err != nil {
  55. logger.Log(0, "error updating node", node.Name, node.ID, " on checkin", err.Error())
  56. return
  57. }
  58. logger.Log(3, "ping processed for node", node.ID)
  59. // --TODO --set client version once feature is implemented.
  60. //node.SetClientVersion(msg.Payload())
  61. }()
  62. }
  63. // UpdateNode message Handler -- handles updates from client nodes
  64. func UpdateNode(client mqtt.Client, msg mqtt.Message) {
  65. go func() {
  66. id, err := GetID(msg.Topic())
  67. if err != nil {
  68. logger.Log(1, "error getting node.ID sent on ", msg.Topic(), err.Error())
  69. return
  70. }
  71. currentNode, err := logic.GetNodeByID(id)
  72. if err != nil {
  73. logger.Log(1, "error getting node ", id, err.Error())
  74. return
  75. }
  76. decrypted, decryptErr := decryptMsg(&currentNode, msg.Payload())
  77. if decryptErr != nil {
  78. logger.Log(1, "failed to decrypt message for node ", id, decryptErr.Error())
  79. return
  80. }
  81. var newNode models.Node
  82. if err := json.Unmarshal(decrypted, &newNode); err != nil {
  83. logger.Log(1, "error unmarshaling payload ", err.Error())
  84. return
  85. }
  86. if err := logic.UpdateNode(&currentNode, &newNode); err != nil {
  87. logger.Log(1, "error saving node", err.Error())
  88. return
  89. }
  90. if err := PublishPeerUpdate(&newNode); err != nil {
  91. logger.Log(1, "error publishing peer update ", err.Error())
  92. return
  93. }
  94. logger.Log(1, "Updated node", id, newNode.Name)
  95. }()
  96. }
  97. // PublishPeerUpdate --- deterines and publishes a peer update to all the peers of a node
  98. func PublishPeerUpdate(newNode *models.Node) error {
  99. if !servercfg.IsMessageQueueBackend() {
  100. return nil
  101. }
  102. networkNodes, err := logic.GetNetworkNodes(newNode.Network)
  103. if err != nil {
  104. logger.Log(1, "err getting Network Nodes", err.Error())
  105. return err
  106. }
  107. for _, node := range networkNodes {
  108. if node.IsServer == "yes" || node.ID == newNode.ID {
  109. continue
  110. }
  111. peerUpdate, err := logic.GetPeerUpdate(&node)
  112. if err != nil {
  113. logger.Log(1, "error getting peer update for node", node.ID, err.Error())
  114. continue
  115. }
  116. data, err := json.Marshal(&peerUpdate)
  117. if err != nil {
  118. logger.Log(2, "error marshaling peer update for node", node.ID, err.Error())
  119. continue
  120. }
  121. if err = publish(&node, fmt.Sprintf("peers/%s/%s", node.Network, node.ID), data); err != nil {
  122. logger.Log(1, "failed to publish peer update for node", node.ID)
  123. } else {
  124. logger.Log(1, "sent peer update for node", node.Name, "on network:", node.Network)
  125. }
  126. }
  127. return nil
  128. }
  129. // PublishPeerUpdate --- deterines and publishes a peer update to all the peers of a node
  130. func PublishExtPeerUpdate(node *models.Node) error {
  131. var err error
  132. if logic.IsLocalServer(node) {
  133. if err = logic.ServerUpdate(node, false); err != nil {
  134. logger.Log(1, "server node:", node.ID, "failed to update peers with ext clients")
  135. return err
  136. } else {
  137. return nil
  138. }
  139. }
  140. if !servercfg.IsMessageQueueBackend() {
  141. return nil
  142. }
  143. peerUpdate, err := logic.GetPeerUpdate(node)
  144. if err != nil {
  145. return err
  146. }
  147. data, err := json.Marshal(&peerUpdate)
  148. if err != nil {
  149. return err
  150. }
  151. return publish(node, fmt.Sprintf("peers/%s/%s", node.Network, node.ID), data)
  152. }
  // GetID -- decodes a message queue topic and returns the embedded node.ID.
  // The ID is the text after the last "/" in the topic. An error is returned
  // when the topic contains no "/" at all or when nothing follows the last "/",
  // so callers never receive an empty ID together with a nil error.
  func GetID(topic string) (string, error) {
  	sep := strings.LastIndex(topic, "/")
  	if sep < 0 {
  		return "", errors.New("invalid topic")
  	}
  	// the last part of the topic will be the node.ID
  	id := topic[sep+1:]
  	if id == "" {
  		return "", errors.New("invalid topic: missing node id")
  	}
  	return id, nil
  }
  163. // NodeUpdate -- publishes a node update
  164. func NodeUpdate(node *models.Node) error {
  165. if !servercfg.IsMessageQueueBackend() {
  166. return nil
  167. }
  168. logger.Log(3, "publishing node update to "+node.Name)
  169. data, err := json.Marshal(node)
  170. if err != nil {
  171. logger.Log(2, "error marshalling node update ", err.Error())
  172. return err
  173. }
  174. if err = publish(node, fmt.Sprintf("update/%s/%s", node.Network, node.ID), data); err != nil {
  175. logger.Log(2, "error publishing node update to peer ", node.ID, err.Error())
  176. return err
  177. }
  178. return nil
  179. }
  180. // SetupMQTT creates a connection to broker and return client
  181. func SetupMQTT(publish bool) mqtt.Client {
  182. opts := mqtt.NewClientOptions()
  183. opts.AddBroker(servercfg.GetMessageQueueEndpoint())
  184. id := ncutils.MakeRandomString(23)
  185. opts.ClientID = id
  186. opts.SetAutoReconnect(true)
  187. opts.SetConnectRetry(true)
  188. opts.SetConnectRetryInterval(time.Second << 2)
  189. opts.SetKeepAlive(time.Minute)
  190. opts.SetWriteTimeout(time.Minute)
  191. opts.SetOnConnectHandler(func(client mqtt.Client) {
  192. if !publish {
  193. if servercfg.GetDebug() {
  194. if token := client.Subscribe("#", 2, mqtt.MessageHandler(DefaultHandler)); token.Wait() && token.Error() != nil {
  195. client.Disconnect(240)
  196. logger.Log(0, "default subscription failed")
  197. }
  198. }
  199. if token := client.Subscribe("ping/#", 2, mqtt.MessageHandler(Ping)); token.Wait() && token.Error() != nil {
  200. client.Disconnect(240)
  201. logger.Log(0, "ping subscription failed")
  202. }
  203. if token := client.Subscribe("update/#", 0, mqtt.MessageHandler(UpdateNode)); token.Wait() && token.Error() != nil {
  204. client.Disconnect(240)
  205. logger.Log(0, "node update subscription failed")
  206. }
  207. opts.SetOrderMatters(true)
  208. opts.SetResumeSubs(true)
  209. }
  210. })
  211. client := mqtt.NewClient(opts)
  212. tperiod := time.Now().Add(10 * time.Second)
  213. for {
  214. if token := client.Connect(); token.Wait() && token.Error() != nil {
  215. logger.Log(2, "unable to connect to broker, retrying ...")
  216. if time.Now().After(tperiod) {
  217. log.Fatal(0, "could not connect to broker, exiting ...", token.Error())
  218. }
  219. } else {
  220. break
  221. }
  222. time.Sleep(2 * time.Second)
  223. }
  224. return client
  225. }
  226. // Keepalive -- periodically pings all nodes to let them know server is still alive and doing well
  227. func Keepalive(ctx context.Context) {
  228. for {
  229. select {
  230. case <-ctx.Done():
  231. return
  232. case <-time.After(time.Second * KEEPALIVE_TIMEOUT):
  233. sendPeers()
  234. }
  235. }
  236. }
  237. // sendPeers - retrieve networks, send peer ports to all peers
  238. func sendPeers() {
  239. var force bool
  240. peer_force_send++
  241. if peer_force_send == 5 {
  242. force = true
  243. peer_force_send = 0
  244. }
  245. networks, err := logic.GetNetworks()
  246. if err != nil {
  247. logger.Log(1, "error retrieving networks for keepalive", err.Error())
  248. }
  249. for _, network := range networks {
  250. serverNode, errN := logic.GetNetworkServerLeader(network.NetID)
  251. if errN == nil {
  252. serverNode.SetLastCheckIn()
  253. logic.UpdateNode(&serverNode, &serverNode)
  254. if network.DefaultUDPHolePunch == "yes" {
  255. if logic.ShouldPublishPeerPorts(&serverNode) || force {
  256. if force {
  257. logger.Log(2, "sending scheduled peer update (5 min)")
  258. }
  259. err = PublishPeerUpdate(&serverNode)
  260. if err != nil {
  261. logger.Log(1, "error publishing udp port updates for network", network.NetID)
  262. logger.Log(1, errN.Error())
  263. }
  264. }
  265. }
  266. } else {
  267. logger.Log(1, "unable to retrieve leader for network ", network.NetID)
  268. logger.Log(1, errN.Error())
  269. continue
  270. }
  271. }
  272. }
  273. // func publishServerKeepalive(client mqtt.Client, network *models.Network) {
  274. // nodes, err := logic.GetNetworkNodes(network.NetID)
  275. // if err != nil {
  276. // return
  277. // }
  278. // for _, node := range nodes {
  279. // if token := client.Publish(fmt.Sprintf("serverkeepalive/%s/%s", network.NetID, node.ID), 0, false, servercfg.GetVersion()); token.Wait() && token.Error() != nil {
  280. // logger.Log(1, "error publishing server keepalive for network", network.NetID, token.Error().Error())
  281. // } else {
  282. // logger.Log(2, "keepalive sent for network/node", network.NetID, node.ID)
  283. // }
  284. // }
  285. // }