zombie.go 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118
  1. package logic
  2. import (
  3. "context"
  4. "time"
  5. "github.com/gravitl/netmaker/logger"
  6. "github.com/gravitl/netmaker/models"
  7. )
  // ZOMBIE_TIMEOUT - interval, in seconds, between checks of the zombie quarantine list
  const ZOMBIE_TIMEOUT = 60

  // ZOMBIE_DELETE_TIME - time, in minutes, since last check-in after which a zombie node is deleted
  const ZOMBIE_DELETE_TIME = 10
  // zombies holds the IDs of the nodes currently on the zombie quarantine list.
  var zombies []string

  // removeZombie carries IDs of nodes to be taken off the quarantine list;
  // it is buffered for up to 10 pending IDs.
  var removeZombie = make(chan string, 10)

  // newZombie carries IDs of nodes to be put on the quarantine list;
  // it is buffered for up to 10 pending IDs.
  var newZombie = make(chan string, 10)
  19. // CheckZombies - checks if new node has same macaddress as existing node
  20. // if so, existing node is added to zombie node quarantine list
  21. func CheckZombies(newnode *models.Node) {
  22. nodes, err := GetNetworkNodes(newnode.Network)
  23. if err != nil {
  24. logger.Log(1, "Failed to retrieve network nodes", newnode.Network, err.Error())
  25. return
  26. }
  27. for _, node := range nodes {
  28. if node.MacAddress == newnode.MacAddress {
  29. logger.Log(0, "adding ", node.ID, " to zombie list")
  30. newZombie <- node.ID
  31. }
  32. }
  33. }
  34. // ManageZombies - goroutine which adds/removes/deletes nodes from the zombie node quarantine list
  35. func ManageZombies(ctx context.Context) {
  36. logger.Log(2, "Zombie management started")
  37. InitializeZombies()
  38. for {
  39. select {
  40. case <-ctx.Done():
  41. return
  42. case id := <-newZombie:
  43. logger.Log(1, "adding", id, "to zombie quaratine list")
  44. zombies = append(zombies, id)
  45. case id := <-removeZombie:
  46. found := false
  47. if len(zombies) > 0 {
  48. for i := len(zombies) - 1; i >= 0; i-- {
  49. if zombies[i] == id {
  50. logger.Log(1, "removing zombie from quaratine list", zombies[i])
  51. zombies = append(zombies[:i], zombies[i+1:]...)
  52. found = true
  53. }
  54. }
  55. }
  56. if !found {
  57. logger.Log(3, "no zombies found")
  58. }
  59. case <-time.After(time.Second * ZOMBIE_TIMEOUT):
  60. logger.Log(0, "checking for zombie nodes")
  61. if len(zombies) > 0 {
  62. for i := len(zombies) - 1; i >= 0; i-- {
  63. node, err := GetNodeByID(zombies[i])
  64. if err != nil {
  65. logger.Log(1, "error retrieving zombie node", zombies[i], err.Error())
  66. logger.Log(1, "deleting ", node.Name, " from zombie list")
  67. zombies = append(zombies[:i], zombies[i+1:]...)
  68. continue
  69. }
  70. if time.Since(time.Unix(node.LastCheckIn, 0)) > time.Minute*ZOMBIE_DELETE_TIME {
  71. if err := DeleteNodeByID(&node, true); err != nil {
  72. logger.Log(1, "error deleting zombie node", zombies[i], err.Error())
  73. continue
  74. }
  75. logger.Log(1, "deleting zombie node", node.Name)
  76. zombies = append(zombies[:i], zombies[i+1:]...)
  77. }
  78. }
  79. }
  80. }
  81. }
  82. }
  83. // InitializeZombies - populates the zombie quarantine list (should be called from initialization)
  84. func InitializeZombies() {
  85. nodes, err := GetAllNodes()
  86. if err != nil {
  87. logger.Log(1, "failed to retrieve nodes", err.Error())
  88. return
  89. }
  90. for _, node := range nodes {
  91. othernodes, err := GetNetworkNodes(node.Network)
  92. if err != nil {
  93. logger.Log(1, "failled to retrieve nodes for network", node.Network, err.Error())
  94. continue
  95. }
  96. for _, othernode := range othernodes {
  97. if node.ID == othernode.ID {
  98. continue
  99. }
  100. if node.MacAddress == othernode.MacAddress {
  101. if node.LastCheckIn > othernode.LastCheckIn {
  102. zombies = append(zombies, othernode.ID)
  103. logger.Log(1, "adding ", othernode.Name, " with ID ", othernode.ID, " to zombie list")
  104. } else {
  105. zombies = append(zombies, node.ID)
  106. logger.Log(1, "adding ", node.Name, " with ID ", node.ID, " to zombie list")
  107. }
  108. }
  109. }
  110. }
  111. }