zombie.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161
  1. package logic
  2. import (
  3. "context"
  4. "time"
  5. "github.com/google/uuid"
  6. "github.com/gravitl/netmaker/logger"
  7. "github.com/gravitl/netmaker/models"
  8. )
  9. const (
  10. // ZOMBIE_TIMEOUT - timeout in seconds for checking zombie status
  11. ZOMBIE_TIMEOUT = 60
  12. // ZOMBIE_DELETE_TIME - timeout in minutes for zombie node deletion
  13. ZOMBIE_DELETE_TIME = 10
  14. )
  15. var (
  16. zombies []uuid.UUID
  17. hostZombies []uuid.UUID
  18. newZombie chan uuid.UUID = make(chan (uuid.UUID), 10)
  19. newHostZombie chan uuid.UUID = make(chan (uuid.UUID), 10)
  20. )
  21. // CheckZombies - checks if new node has same hostid as existing node
  22. // if so, existing node is added to zombie node quarantine list
  23. // also cleans up nodes past their expiration date
  24. func CheckZombies(newnode *models.Node) {
  25. nodes, err := GetNetworkNodes(newnode.Network)
  26. if err != nil {
  27. logger.Log(1, "Failed to retrieve network nodes", newnode.Network, err.Error())
  28. return
  29. }
  30. for _, node := range nodes {
  31. if node.ID == newnode.ID {
  32. //skip self
  33. continue
  34. }
  35. if node.HostID == newnode.HostID || time.Now().After(node.ExpirationDateTime) {
  36. logger.Log(0, "adding ", node.ID.String(), " to zombie list")
  37. newZombie <- node.ID
  38. }
  39. }
  40. }
  41. // checkForZombieHosts - checks if new host has the same macAddress as an existing host
  42. // if true, existing host is added to host zombie collection
  43. func checkForZombieHosts(h *models.Host) {
  44. hosts, err := GetAllHosts()
  45. if err != nil {
  46. logger.Log(3, "errror retrieving all hosts", err.Error())
  47. }
  48. for _, existing := range hosts {
  49. if existing.ID == h.ID {
  50. //probably an unnecessary check as new host should not be in database yet, but just in case
  51. //skip self
  52. continue
  53. }
  54. if existing.MacAddress.String() == h.MacAddress.String() {
  55. //add to hostZombies
  56. newHostZombie <- existing.ID
  57. //add all nodes belonging to host to zombile list
  58. for _, node := range existing.Nodes {
  59. id, err := uuid.Parse(node)
  60. if err != nil {
  61. logger.Log(3, "error parsing uuid from host.Nodes", err.Error())
  62. continue
  63. }
  64. newHostZombie <- id
  65. }
  66. }
  67. }
  68. }
  69. // ManageZombies - goroutine which adds/removes/deletes nodes from the zombie node quarantine list
  70. func ManageZombies(ctx context.Context, peerUpdate chan *models.Node) {
  71. logger.Log(2, "Zombie management started")
  72. InitializeZombies()
  73. for {
  74. select {
  75. case <-ctx.Done():
  76. close(peerUpdate)
  77. return
  78. case id := <-newZombie:
  79. zombies = append(zombies, id)
  80. case id := <-newHostZombie:
  81. hostZombies = append(hostZombies, id)
  82. case <-time.After(time.Second * ZOMBIE_TIMEOUT):
  83. logger.Log(3, "checking for zombie nodes")
  84. if len(zombies) > 0 {
  85. for i := len(zombies) - 1; i >= 0; i-- {
  86. node, err := GetNodeByID(zombies[i].String())
  87. if err != nil {
  88. logger.Log(1, "error retrieving zombie node", zombies[i].String(), err.Error())
  89. logger.Log(1, "deleting ", node.ID.String(), " from zombie list")
  90. zombies = append(zombies[:i], zombies[i+1:]...)
  91. continue
  92. }
  93. if time.Since(node.LastCheckIn) > time.Minute*ZOMBIE_DELETE_TIME || time.Now().After(node.ExpirationDateTime) {
  94. if err := DeleteNode(&node, true); err != nil {
  95. logger.Log(1, "error deleting zombie node", zombies[i].String(), err.Error())
  96. continue
  97. }
  98. node.Action = models.NODE_DELETE
  99. peerUpdate <- &node
  100. logger.Log(1, "deleting zombie node", node.ID.String())
  101. zombies = append(zombies[:i], zombies[i+1:]...)
  102. }
  103. }
  104. }
  105. if len(hostZombies) > 0 {
  106. logger.Log(3, "checking host zombies")
  107. for i := len(hostZombies) - 1; i >= 0; i-- {
  108. host, err := GetHost(hostZombies[i].String())
  109. if err != nil {
  110. logger.Log(1, "error retrieving zombie host", err.Error())
  111. logger.Log(1, "deleting ", host.ID.String(), " from zombie list")
  112. zombies = append(zombies[:i], zombies[i+1:]...)
  113. continue
  114. }
  115. if len(host.Nodes) == 0 {
  116. if err := RemoveHost(host); err != nil {
  117. logger.Log(0, "error deleting zombie host", host.ID.String(), err.Error())
  118. }
  119. }
  120. }
  121. }
  122. }
  123. }
  124. }
  125. // InitializeZombies - populates the zombie quarantine list (should be called from initialization)
  126. func InitializeZombies() {
  127. nodes, err := GetAllNodes()
  128. if err != nil {
  129. logger.Log(1, "failed to retrieve nodes", err.Error())
  130. return
  131. }
  132. for _, node := range nodes {
  133. othernodes, err := GetNetworkNodes(node.Network)
  134. if err != nil {
  135. logger.Log(1, "failled to retrieve nodes for network", node.Network, err.Error())
  136. continue
  137. }
  138. for _, othernode := range othernodes {
  139. if node.ID == othernode.ID {
  140. continue
  141. }
  142. if node.HostID == othernode.HostID {
  143. if node.LastCheckIn.After(othernode.LastCheckIn) {
  144. newZombie <- othernode.ID
  145. logger.Log(1, "adding", othernode.ID.String(), "to zombie list")
  146. } else {
  147. newZombie <- node.ID
  148. logger.Log(1, "adding", node.ID.String(), "to zombie list")
  149. }
  150. }
  151. }
  152. }
  153. }