zombie.go 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127
  1. package logic
  2. import (
  3. "context"
  4. "net"
  5. "time"
  6. "github.com/google/uuid"
  7. "github.com/gravitl/netmaker/logger"
  8. "github.com/gravitl/netmaker/models"
  9. )
  // ZOMBIE_TIMEOUT - number of seconds ManageZombies waits before each check of the zombie quarantine list
  const ZOMBIE_TIMEOUT = 60

  // ZOMBIE_DELETE_TIME - number of minutes without a check-in after which a quarantined node is deleted
  const ZOMBIE_DELETE_TIME = 10
  16. var (
  17. zombies []uuid.UUID
  18. removeZombie chan uuid.UUID = make(chan (uuid.UUID), 10)
  19. newZombie chan uuid.UUID = make(chan (uuid.UUID), 10)
  20. )
  21. // CheckZombies - checks if new node has same macaddress as existing node
  22. // if so, existing node is added to zombie node quarantine list
  23. // also cleans up nodes past their expiration date
  24. func CheckZombies(newnode *models.Node, mac net.HardwareAddr) {
  25. nodes, err := GetNetworkNodes(newnode.Network)
  26. if err != nil {
  27. logger.Log(1, "Failed to retrieve network nodes", newnode.Network, err.Error())
  28. return
  29. }
  30. for _, node := range nodes {
  31. if node.ID == newnode.ID {
  32. //skip self
  33. continue
  34. }
  35. if node.HostID == newnode.HostID || time.Now().After(node.ExpirationDateTime) {
  36. logger.Log(0, "adding ", node.ID.String(), " to zombie list")
  37. newZombie <- node.ID
  38. }
  39. }
  40. }
  41. // ManageZombies - goroutine which adds/removes/deletes nodes from the zombie node quarantine list
  42. func ManageZombies(ctx context.Context, peerUpdate chan *models.Node) {
  43. logger.Log(2, "Zombie management started")
  44. InitializeZombies()
  45. for {
  46. select {
  47. case <-ctx.Done():
  48. return
  49. case id := <-newZombie:
  50. logger.Log(1, "adding", id.String(), "to zombie quaratine list")
  51. zombies = append(zombies, id)
  52. case id := <-removeZombie:
  53. found := false
  54. if len(zombies) > 0 {
  55. for i := len(zombies) - 1; i >= 0; i-- {
  56. if zombies[i] == id {
  57. logger.Log(1, "removing zombie from quaratine list", zombies[i].String())
  58. zombies = append(zombies[:i], zombies[i+1:]...)
  59. found = true
  60. }
  61. }
  62. }
  63. if !found {
  64. logger.Log(3, "no zombies found")
  65. }
  66. case <-time.After(time.Second * ZOMBIE_TIMEOUT):
  67. logger.Log(3, "checking for zombie nodes")
  68. if len(zombies) > 0 {
  69. for i := len(zombies) - 1; i >= 0; i-- {
  70. node, err := GetNodeByID(zombies[i].String())
  71. if err != nil {
  72. logger.Log(1, "error retrieving zombie node", zombies[i].String(), err.Error())
  73. logger.Log(1, "deleting ", node.ID.String(), " from zombie list")
  74. zombies = append(zombies[:i], zombies[i+1:]...)
  75. continue
  76. }
  77. if time.Since(node.LastCheckIn) > time.Minute*ZOMBIE_DELETE_TIME || time.Now().After(node.ExpirationDateTime) {
  78. if err := DeleteNode(&node, true); err != nil {
  79. logger.Log(1, "error deleting zombie node", zombies[i].String(), err.Error())
  80. continue
  81. }
  82. node.Action = models.NODE_DELETE
  83. peerUpdate <- &node
  84. logger.Log(1, "deleting zombie node", node.ID.String())
  85. zombies = append(zombies[:i], zombies[i+1:]...)
  86. }
  87. }
  88. }
  89. }
  90. }
  91. }
  92. // InitializeZombies - populates the zombie quarantine list (should be called from initialization)
  93. func InitializeZombies() {
  94. nodes, err := GetAllNodes()
  95. if err != nil {
  96. logger.Log(1, "failed to retrieve nodes", err.Error())
  97. return
  98. }
  99. for _, node := range nodes {
  100. othernodes, err := GetNetworkNodes(node.Network)
  101. if err != nil {
  102. logger.Log(1, "failled to retrieve nodes for network", node.Network, err.Error())
  103. continue
  104. }
  105. for _, othernode := range othernodes {
  106. if node.ID == othernode.ID {
  107. continue
  108. }
  109. if node.HostID == othernode.HostID {
  110. if node.LastCheckIn.After(othernode.LastCheckIn) {
  111. zombies = append(zombies, othernode.ID)
  112. logger.Log(1, "adding", othernode.ID.String(), "to zombie list")
  113. } else {
  114. zombies = append(zombies, node.ID)
  115. logger.Log(1, "adding", node.ID.String(), "to zombie list")
  116. }
  117. }
  118. }
  119. }
  120. }