handlers.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400
  1. package mq
  2. import (
  3. "encoding/json"
  4. "fmt"
  5. "time"
  6. mqtt "github.com/eclipse/paho.mqtt.golang"
  7. "github.com/gravitl/netmaker/database"
  8. "github.com/gravitl/netmaker/logger"
  9. "github.com/gravitl/netmaker/logic"
  10. "github.com/gravitl/netmaker/models"
  11. "github.com/gravitl/netmaker/netclient/ncutils"
  12. "github.com/gravitl/netmaker/servercfg"
  13. )
  14. // DefaultHandler default message queue handler -- NOT USED
  15. func DefaultHandler(client mqtt.Client, msg mqtt.Message) {
  16. logger.Log(0, "MQTT Message: Topic: ", string(msg.Topic()), " Message: ", string(msg.Payload()))
  17. }
  18. // Ping message Handler -- handles ping topic from client nodes
  19. func Ping(client mqtt.Client, msg mqtt.Message) {
  20. go func() {
  21. id, err := getID(msg.Topic())
  22. if err != nil {
  23. logger.Log(0, "error getting node.ID sent on ping topic ")
  24. return
  25. }
  26. node, err := logic.GetNodeByID(id)
  27. if err != nil {
  28. logger.Log(0, "mq-ping error getting node: ", err.Error())
  29. record, err := database.FetchRecord(database.NODES_TABLE_NAME, id)
  30. if err != nil {
  31. logger.Log(0, "error reading database ", err.Error())
  32. return
  33. }
  34. logger.Log(0, "record from database")
  35. logger.Log(0, record)
  36. return
  37. }
  38. decrypted, decryptErr := decryptMsg(&node, msg.Payload())
  39. if decryptErr != nil {
  40. logger.Log(0, "error decrypting when updating node ", node.ID.String(), decryptErr.Error())
  41. return
  42. }
  43. var checkin models.NodeCheckin
  44. if err := json.Unmarshal(decrypted, &checkin); err != nil {
  45. logger.Log(1, "error unmarshaling payload ", err.Error())
  46. return
  47. }
  48. host, err := logic.GetHost(node.HostID.String())
  49. if err != nil {
  50. logger.Log(0, "error retrieving host for node ", node.ID.String(), err.Error())
  51. return
  52. }
  53. node.SetLastCheckIn()
  54. host.Version = checkin.Version
  55. node.Connected = checkin.Connected
  56. host.Interfaces = checkin.Ifaces
  57. for i := range host.Interfaces {
  58. host.Interfaces[i].AddressString = host.Interfaces[i].Address.String()
  59. }
  60. if err := logic.UpdateNode(&node, &node); err != nil {
  61. logger.Log(0, "error updating node", node.ID.String(), " on checkin", err.Error())
  62. return
  63. }
  64. logger.Log(3, "ping processed for node", node.ID.String())
  65. // --TODO --set client version once feature is implemented.
  66. //node.SetClientVersion(msg.Payload())
  67. }()
  68. }
  69. // UpdateNode message Handler -- handles updates from client nodes
  70. func UpdateNode(client mqtt.Client, msg mqtt.Message) {
  71. go func() {
  72. id, err := getID(msg.Topic())
  73. if err != nil {
  74. logger.Log(1, "error getting node.ID sent on ", msg.Topic(), err.Error())
  75. return
  76. }
  77. currentNode, err := logic.GetNodeByID(id)
  78. if err != nil {
  79. logger.Log(1, "error getting node ", id, err.Error())
  80. return
  81. }
  82. decrypted, decryptErr := decryptMsg(&currentNode, msg.Payload())
  83. if decryptErr != nil {
  84. logger.Log(1, "failed to decrypt message for node ", id, decryptErr.Error())
  85. return
  86. }
  87. var newNode models.Node
  88. if err := json.Unmarshal(decrypted, &newNode); err != nil {
  89. logger.Log(1, "error unmarshaling payload ", err.Error())
  90. return
  91. }
  92. ifaceDelta := logic.IfaceDelta(&currentNode, &newNode)
  93. if servercfg.Is_EE && ifaceDelta {
  94. if err = logic.EnterpriseResetAllPeersFailovers(currentNode.ID, currentNode.Network); err != nil {
  95. logger.Log(1, "failed to reset failover list during node update", currentNode.ID.String(), currentNode.Network)
  96. }
  97. }
  98. newNode.SetLastCheckIn()
  99. if err := logic.UpdateNode(&currentNode, &newNode); err != nil {
  100. logger.Log(1, "error saving node", err.Error())
  101. return
  102. }
  103. if ifaceDelta { // reduce number of unneeded updates, by only sending on iface changes
  104. if err = PublishPeerUpdate(); err != nil {
  105. logger.Log(0, "error updating peers when node", currentNode.ID.String(), "informed the server of an interface change", err.Error())
  106. }
  107. }
  108. logger.Log(1, "updated node", id, newNode.ID.String())
  109. }()
  110. }
  111. // UpdateHost message Handler -- handles host updates from clients
  112. func UpdateHost(client mqtt.Client, msg mqtt.Message) {
  113. go func(msg mqtt.Message) {
  114. id, err := getID(msg.Topic())
  115. if err != nil {
  116. logger.Log(1, "error getting host.ID sent on ", msg.Topic(), err.Error())
  117. return
  118. }
  119. currentHost, err := logic.GetHost(id)
  120. if err != nil {
  121. logger.Log(1, "error getting host ", id, err.Error())
  122. return
  123. }
  124. decrypted, decryptErr := decryptMsgWithHost(currentHost, msg.Payload())
  125. if decryptErr != nil {
  126. logger.Log(1, "failed to decrypt message for host ", id, decryptErr.Error())
  127. return
  128. }
  129. var hostUpdate models.HostUpdate
  130. if err := json.Unmarshal(decrypted, &hostUpdate); err != nil {
  131. logger.Log(1, "error unmarshaling payload ", err.Error())
  132. return
  133. }
  134. logger.Log(3, fmt.Sprintf("recieved host update: %+v\n", hostUpdate))
  135. var sendPeerUpdate bool
  136. switch hostUpdate.Action {
  137. case models.UpdateHost:
  138. sendPeerUpdate = updateHostFromClient(&hostUpdate.Host, currentHost)
  139. err := logic.UpsertHost(currentHost)
  140. if err != nil {
  141. logger.Log(0, "failed to update host: ", currentHost.ID.String(), err.Error())
  142. return
  143. }
  144. case models.DeleteHost:
  145. if err := logic.DisassociateAllNodesFromHost(currentHost.ID.String()); err != nil {
  146. logger.Log(0, "failed to delete all nodes of host: ", currentHost.ID.String(), err.Error())
  147. return
  148. }
  149. if err := logic.RemoveHostByID(currentHost.ID.String()); err != nil {
  150. logger.Log(0, "failed to delete host: ", currentHost.ID.String(), err.Error())
  151. return
  152. }
  153. sendPeerUpdate = true
  154. }
  155. if sendPeerUpdate {
  156. err := PublishPeerUpdate()
  157. if err != nil {
  158. logger.Log(0, "failed to pulish peer update: ", err.Error())
  159. }
  160. }
  161. if sendPeerUpdate {
  162. err := PublishPeerUpdate()
  163. if err != nil {
  164. logger.Log(0, "failed to pulish peer update: ", err.Error())
  165. }
  166. }
  167. // if servercfg.Is_EE && ifaceDelta {
  168. // if err = logic.EnterpriseResetAllPeersFailovers(currentHost.ID.String(), currentHost.Network); err != nil {
  169. // logger.Log(1, "failed to reset failover list during node update", currentHost.ID.String(), currentHost.Network)
  170. // }
  171. // }
  172. }(msg)
  173. }
  174. // used for updating host on server with update recieved from client
  175. func updateHostFromClient(newHost, currHost *models.Host) (sendPeerUpdate bool) {
  176. if newHost.ListenPort != 0 && currHost.ListenPort != newHost.ListenPort {
  177. currHost.ListenPort = newHost.ListenPort
  178. sendPeerUpdate = true
  179. }
  180. if newHost.ProxyListenPort != 0 && currHost.ProxyListenPort != newHost.ProxyListenPort {
  181. currHost.ProxyListenPort = newHost.ProxyListenPort
  182. sendPeerUpdate = true
  183. }
  184. if newHost.PublicListenPort != 0 && currHost.PublicListenPort != newHost.PublicListenPort {
  185. currHost.PublicListenPort = newHost.PublicListenPort
  186. sendPeerUpdate = true
  187. }
  188. if currHost.ProxyEnabled != newHost.ProxyEnabled {
  189. currHost.ProxyEnabled = newHost.ProxyEnabled
  190. sendPeerUpdate = true
  191. }
  192. if currHost.EndpointIP.String() != newHost.EndpointIP.String() {
  193. currHost.EndpointIP = newHost.EndpointIP
  194. sendPeerUpdate = true
  195. }
  196. currHost.DaemonInstalled = newHost.DaemonInstalled
  197. currHost.Debug = newHost.Debug
  198. currHost.Verbosity = newHost.Verbosity
  199. currHost.Version = newHost.Version
  200. currHost.Name = newHost.Name
  201. return
  202. }
  203. // UpdateMetrics message Handler -- handles updates from client nodes for metrics
  204. func UpdateMetrics(client mqtt.Client, msg mqtt.Message) {
  205. if servercfg.Is_EE {
  206. go func() {
  207. id, err := getID(msg.Topic())
  208. if err != nil {
  209. logger.Log(1, "error getting node.ID sent on ", msg.Topic(), err.Error())
  210. return
  211. }
  212. currentNode, err := logic.GetNodeByID(id)
  213. if err != nil {
  214. logger.Log(1, "error getting node ", id, err.Error())
  215. return
  216. }
  217. decrypted, decryptErr := decryptMsg(&currentNode, msg.Payload())
  218. if decryptErr != nil {
  219. logger.Log(1, "failed to decrypt message for node ", id, decryptErr.Error())
  220. return
  221. }
  222. var newMetrics models.Metrics
  223. if err := json.Unmarshal(decrypted, &newMetrics); err != nil {
  224. logger.Log(1, "error unmarshaling payload ", err.Error())
  225. return
  226. }
  227. shouldUpdate := updateNodeMetrics(&currentNode, &newMetrics)
  228. if err = logic.UpdateMetrics(id, &newMetrics); err != nil {
  229. logger.Log(1, "faield to update node metrics", id, err.Error())
  230. return
  231. }
  232. if servercfg.IsMetricsExporter() {
  233. if err := pushMetricsToExporter(newMetrics); err != nil {
  234. logger.Log(2, fmt.Sprintf("failed to push node: [%s] metrics to exporter, err: %v",
  235. currentNode.ID, err))
  236. }
  237. }
  238. if newMetrics.Connectivity != nil {
  239. err := logic.EnterpriseFailoverFunc(&currentNode)
  240. if err != nil {
  241. logger.Log(0, "failed to failover for node", currentNode.ID.String(), "on network", currentNode.Network, "-", err.Error())
  242. }
  243. }
  244. if shouldUpdate {
  245. logger.Log(2, "updating peers after node", currentNode.ID.String(), currentNode.Network, "detected connectivity issues")
  246. host, err := logic.GetHost(currentNode.HostID.String())
  247. if err == nil {
  248. if err = PublishSingleHostUpdate(host); err != nil {
  249. logger.Log(0, "failed to publish update after failover peer change for node", currentNode.ID.String(), currentNode.Network)
  250. }
  251. }
  252. }
  253. logger.Log(1, "updated node metrics", id)
  254. }()
  255. }
  256. }
  257. // ClientPeerUpdate message handler -- handles updating peers after signal from client nodes
  258. func ClientPeerUpdate(client mqtt.Client, msg mqtt.Message) {
  259. go func() {
  260. id, err := getID(msg.Topic())
  261. if err != nil {
  262. logger.Log(1, "error getting node.ID sent on ", msg.Topic(), err.Error())
  263. return
  264. }
  265. currentNode, err := logic.GetNodeByID(id)
  266. if err != nil {
  267. logger.Log(1, "error getting node ", id, err.Error())
  268. return
  269. }
  270. decrypted, decryptErr := decryptMsg(&currentNode, msg.Payload())
  271. if decryptErr != nil {
  272. logger.Log(1, "failed to decrypt message during client peer update for node ", id, decryptErr.Error())
  273. return
  274. }
  275. switch decrypted[0] {
  276. case ncutils.ACK:
  277. //do we still need this
  278. case ncutils.DONE:
  279. updateNodePeers(&currentNode)
  280. }
  281. logger.Log(1, "sent peer updates after signal received from", id)
  282. }()
  283. }
  284. func updateNodePeers(currentNode *models.Node) {
  285. if err := PublishPeerUpdate(); err != nil {
  286. logger.Log(1, "error publishing peer update ", err.Error())
  287. return
  288. }
  289. }
  290. func updateNodeMetrics(currentNode *models.Node, newMetrics *models.Metrics) bool {
  291. if newMetrics.FailoverPeers == nil {
  292. newMetrics.FailoverPeers = make(map[string]string)
  293. }
  294. oldMetrics, err := logic.GetMetrics(currentNode.ID.String())
  295. if err != nil {
  296. logger.Log(1, "error finding old metrics for node", currentNode.ID.String())
  297. return false
  298. }
  299. if oldMetrics.FailoverPeers == nil {
  300. oldMetrics.FailoverPeers = make(map[string]string)
  301. }
  302. var attachedClients []models.ExtClient
  303. if currentNode.IsIngressGateway {
  304. clients, err := logic.GetExtClientsByID(currentNode.ID.String(), currentNode.Network)
  305. if err == nil {
  306. attachedClients = clients
  307. }
  308. }
  309. if len(attachedClients) > 0 {
  310. // associate ext clients with IDs
  311. for i := range attachedClients {
  312. extMetric := newMetrics.Connectivity[attachedClients[i].PublicKey]
  313. if len(extMetric.NodeName) == 0 &&
  314. len(newMetrics.Connectivity[attachedClients[i].ClientID].NodeName) > 0 { // cover server clients
  315. extMetric = newMetrics.Connectivity[attachedClients[i].ClientID]
  316. if extMetric.TotalReceived > 0 && extMetric.TotalSent > 0 {
  317. extMetric.Connected = true
  318. }
  319. }
  320. extMetric.NodeName = attachedClients[i].ClientID
  321. delete(newMetrics.Connectivity, attachedClients[i].PublicKey)
  322. newMetrics.Connectivity[attachedClients[i].ClientID] = extMetric
  323. }
  324. }
  325. // run through metrics for each peer
  326. for k := range newMetrics.Connectivity {
  327. currMetric := newMetrics.Connectivity[k]
  328. oldMetric := oldMetrics.Connectivity[k]
  329. currMetric.TotalTime += oldMetric.TotalTime
  330. currMetric.Uptime += oldMetric.Uptime // get the total uptime for this connection
  331. if currMetric.Uptime == 0 || currMetric.TotalTime == 0 {
  332. currMetric.PercentUp = 0
  333. } else {
  334. currMetric.PercentUp = 100.0 * (float64(currMetric.Uptime) / float64(currMetric.TotalTime))
  335. }
  336. totalUpMinutes := currMetric.Uptime * ncutils.CheckInInterval
  337. currMetric.ActualUptime = time.Duration(totalUpMinutes) * time.Minute
  338. delete(oldMetrics.Connectivity, k) // remove from old data
  339. newMetrics.Connectivity[k] = currMetric
  340. }
  341. // add nodes that need failover
  342. nodes, err := logic.GetNetworkNodes(currentNode.Network)
  343. if err != nil {
  344. logger.Log(0, "failed to retrieve nodes while updating metrics")
  345. return false
  346. }
  347. for _, node := range nodes {
  348. if !newMetrics.Connectivity[node.ID.String()].Connected &&
  349. len(newMetrics.Connectivity[node.ID.String()].NodeName) > 0 &&
  350. node.Connected &&
  351. len(node.FailoverNode) > 0 &&
  352. !node.Failover {
  353. newMetrics.FailoverPeers[node.ID.String()] = node.FailoverNode.String()
  354. }
  355. }
  356. shouldUpdate := len(oldMetrics.FailoverPeers) == 0 && len(newMetrics.FailoverPeers) > 0
  357. for k, v := range oldMetrics.FailoverPeers {
  358. if len(newMetrics.FailoverPeers[k]) > 0 && len(v) == 0 {
  359. shouldUpdate = true
  360. }
  361. if len(v) > 0 && len(newMetrics.FailoverPeers[k]) == 0 {
  362. newMetrics.FailoverPeers[k] = v
  363. }
  364. }
  365. for k := range oldMetrics.Connectivity { // cleanup any left over data, self healing
  366. delete(newMetrics.Connectivity, k)
  367. }
  368. return shouldUpdate
  369. }