mirror of
https://github.com/gravitl/netmaker.git
synced 2025-10-24 21:24:35 +08:00
Merge pull request #1204 from gravitl/feature_v0.14.3_zombies
Feature v0.14.3 zombies
This commit is contained in:
commit
b0a46b8878
3 changed files with 110 additions and 1 deletions
|
@ -213,7 +213,7 @@ func DeleteNodeByID(node *models.Node, exterminate bool) error {
|
|||
// ignoring for now, could hit a nil pointer if delete called twice
|
||||
logger.Log(2, "attempted to remove node ACL for node", node.Name, node.ID)
|
||||
}
|
||||
|
||||
removeZombie <- node.ID
|
||||
return removeLocalServer(node)
|
||||
}
|
||||
|
||||
|
@ -313,6 +313,7 @@ func CreateNode(node *models.Node) error {
|
|||
if err != nil {
|
||||
return err
|
||||
}
|
||||
CheckZombies(node)
|
||||
|
||||
nodebytes, err := json.Marshal(&node)
|
||||
if err != nil {
|
||||
|
|
106
logic/zombie.go
Normal file
106
logic/zombie.go
Normal file
|
@ -0,0 +1,106 @@
|
|||
package logic
|
||||
|
||||
import (
|
||||
"context"
|
||||
"time"
|
||||
|
||||
"github.com/gravitl/netmaker/logger"
|
||||
"github.com/gravitl/netmaker/models"
|
||||
)
|
||||
|
||||
// Timing parameters for zombie handling. Both are untyped constants; the code
// in this file multiplies them by a time unit before use.
const (
	// ZOMBIE_TIMEOUT - number of seconds between checks of the zombie quarantine list
	ZOMBIE_TIMEOUT = 60
	// ZOMBIE_DELETE_TIME - number of minutes since last check-in after which a quarantined node is deleted
	ZOMBIE_DELETE_TIME = 10
)

// Package-level state for zombie handling.
var (
	// zombies - IDs of the nodes currently in the quarantine list
	zombies []string
	// newZombie - unbuffered channel carrying IDs to add to the quarantine list
	newZombie = make(chan string)
	// removeZombie - unbuffered channel carrying IDs to drop from the quarantine list
	removeZombie = make(chan string)
)
|
||||
|
||||
// CheckZombies - checks if new node has same macaddress as existing node
|
||||
// if so, existing node is added to zombie node quarantine list
|
||||
func CheckZombies(newnode *models.Node) {
|
||||
nodes, err := GetNetworkNodes(newnode.Network)
|
||||
if err != nil {
|
||||
logger.Log(1, "Failed to retrieve network nodes", newnode.Network, err.Error())
|
||||
return
|
||||
}
|
||||
for _, node := range nodes {
|
||||
if node.MacAddress == newnode.MacAddress {
|
||||
newZombie <- node.ID
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// ManageZombies - goroutine which adds/removes/deletes nodes from the zombie node quarantine list
|
||||
func ManageZombies(ctx context.Context) {
|
||||
for {
|
||||
select {
|
||||
case <-ctx.Done():
|
||||
return
|
||||
case id := <-newZombie:
|
||||
logger.Log(1, "adding", id, "to zombie quaratine list")
|
||||
zombies = append(zombies, id)
|
||||
case id := <-removeZombie:
|
||||
found := false
|
||||
for i, zombie := range zombies {
|
||||
if zombie == id {
|
||||
logger.Log(1, "removing zombie from quaratine list", zombie)
|
||||
zombies = append(zombies[:i], zombies[i+1:]...)
|
||||
found = true
|
||||
}
|
||||
}
|
||||
if !found {
|
||||
logger.Log(3, "no zombies found")
|
||||
}
|
||||
case <-time.After(time.Second * ZOMBIE_TIMEOUT):
|
||||
for i, zombie := range zombies {
|
||||
node, err := GetNodeByID(zombie)
|
||||
if err != nil {
|
||||
logger.Log(1, "error retrieving zombie node", zombie, err.Error())
|
||||
continue
|
||||
}
|
||||
if time.Since(time.Unix(node.LastCheckIn, 0)) > time.Minute*ZOMBIE_DELETE_TIME {
|
||||
if err := DeleteNodeByID(&node, true); err != nil {
|
||||
logger.Log(1, "error deleting zombie node", zombie, err.Error())
|
||||
continue
|
||||
}
|
||||
logger.Log(1, "deleting zombie node", node.Name)
|
||||
zombies = append(zombies[:i], zombies[i+1:]...)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// InitializeZombies - populates the zombie quarantine list (should be called from initialization)
|
||||
func InitalizeZombies() {
|
||||
nodes, err := GetAllNodes()
|
||||
if err != nil {
|
||||
logger.Log(1, "failed to retrieve nodes", err.Error())
|
||||
return
|
||||
}
|
||||
for _, node := range nodes {
|
||||
othernodes, err := GetNetworkNodes(node.Network)
|
||||
if err != nil {
|
||||
logger.Log(1, "failled to retrieve nodes for network", node.Network, err.Error())
|
||||
continue
|
||||
}
|
||||
for _, othernode := range othernodes {
|
||||
if node.ID == othernode.ID {
|
||||
continue
|
||||
}
|
||||
if node.MacAddress == othernode.MacAddress {
|
||||
if node.LastCheckIn > othernode.LastCheckIn {
|
||||
zombies = append(zombies, othernode.ID)
|
||||
} else {
|
||||
zombies = append(zombies, node.ID)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
2
main.go
2
main.go
|
@ -127,6 +127,7 @@ func initialize() { // Client Mode Prereq Check
|
|||
logger.Log(0, "error occurred when notifying nodes of startup", err.Error())
|
||||
}
|
||||
}
|
||||
logic.InitalizeZombies()
|
||||
}
|
||||
|
||||
func startControllers() {
|
||||
|
@ -169,6 +170,7 @@ func runMessageQueue(wg *sync.WaitGroup) {
|
|||
var client = mq.SetupMQTT(false) // Set up the subscription listener
|
||||
ctx, cancel := context.WithCancel(context.Background())
|
||||
go mq.Keepalive(ctx)
|
||||
go logic.ManageZombies(ctx)
|
||||
quit := make(chan os.Signal, 1)
|
||||
signal.Notify(quit, syscall.SIGTERM, os.Interrupt)
|
||||
<-quit
|
||||
|
|
Loading…
Add table
Reference in a new issue