package functions import ( "context" "crypto/tls" "crypto/x509" "errors" "fmt" "io/ioutil" "log" "os" "os/signal" "strings" "sync" "syscall" "time" mqtt "github.com/eclipse/paho.mqtt.golang" "github.com/go-ping/ping" "github.com/gravitl/netmaker/logger" "github.com/gravitl/netmaker/models" "github.com/gravitl/netmaker/netclient/auth" "github.com/gravitl/netmaker/netclient/config" "github.com/gravitl/netmaker/netclient/daemon" "github.com/gravitl/netmaker/netclient/ncutils" "github.com/gravitl/netmaker/netclient/wireguard" "golang.zx2c4.com/wireguard/wgctrl/wgtypes" ) var messageCache = new(sync.Map) var networkcontext = new(sync.Map) const lastNodeUpdate = "lnu" const lastPeerUpdate = "lpu" type cachedMessage struct { Message string LastSeen time.Time } // Daemon runs netclient daemon from command line func Daemon() error { logger.Log(0, "starting daemon") // == start mq for each server == // == add waitgroup and cancel for checkin routine == ctx, cancel := context.WithCancel(context.Background()) wg := sync.WaitGroup{} networks, _ := ncutils.GetSystemNetworks() for _, network := range networks { //temporary code --- remove in version v0.13.0 removeHostDNS(network, ncutils.IsWindows()) // end of code to be removed in version v0.13.0 var cfg config.ClientConfig cfg.Network = network cfg.ReadConfig() // == initial pull of all networks == initialPull(cfg.Network) logger.Log(1, "started mq for server ", cfg.NetworkSettings.NetID) wg.Add(1) go messageQueue(ctx, wg, &cfg) } wg.Add(1) go Checkin(ctx, &wg) quit := make(chan os.Signal, 1) signal.Notify(quit, syscall.SIGTERM, os.Interrupt, os.Kill) <-quit //for currCommsNet := range commsNetworks { // if cancel, ok := networkcontext.Load(currCommsNet); ok { // cancel.(context.CancelFunc)() // } //} cancel() logger.Log(0, "shutting down netclient daemon") wg.Wait() logger.Log(0, "shutdown complete") return nil } // UpdateKeys -- updates private key and returns new publickey func UpdateKeys(nodeCfg *config.ClientConfig, client mqtt.Client) error { logger.Log(0, "received message to update wireguard keys for network ", nodeCfg.Network) key, err := wgtypes.GeneratePrivateKey() if err != nil { logger.Log(0, "error generating privatekey ", err.Error()) return err } file := ncutils.GetNetclientPathSpecific() + nodeCfg.Node.Interface + ".conf" if err := wireguard.UpdatePrivateKey(file, key.String()); err != nil { logger.Log(0, "error updating wireguard key ", err.Error()) return err } if storeErr := wireguard.StorePrivKey(key.String(), nodeCfg.Network); storeErr != nil { logger.Log(0, "failed to save private key", storeErr.Error()) return storeErr } nodeCfg.Node.PublicKey = key.PublicKey().String() PublishNodeUpdate(nodeCfg) return nil } // PingServer -- checks if server is reachable func PingServer(cfg *config.ClientConfig) error { pinger, err := ping.NewPinger(cfg.Server.ServerName) if err != nil { return err } pinger.Timeout = 2 * time.Second pinger.Run() stats := pinger.Statistics() if stats.PacketLoss == 100 { return errors.New("ping error") } return nil } // == Private == // sets MQ client subscriptions for a specific node config // should be called for each node belonging to a given comms network func setSubscriptions(client mqtt.Client, nodeCfg *config.ClientConfig) { if nodeCfg.DebugOn { if token := client.Subscribe("#", 0, nil); token.Wait() && token.Error() != nil { logger.Log(0, token.Error().Error()) return } logger.Log(0, "subscribed to all topics for debugging purposes") } if token := client.Subscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(NodeUpdate)); token.Wait() && token.Error() != nil { logger.Log(0, token.Error().Error()) return } logger.Log(2, fmt.Sprintf("subscribed to node updates for node %s update/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID)) if token := client.Subscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(UpdatePeers)); token.Wait() && token.Error() != nil { logger.Log(0, token.Error().Error()) return } logger.Log(2, fmt.Sprintf("subscribed to peer updates for node %s peers/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID)) } // on a delete usually, pass in the nodecfg to unsubscribe client broker communications // for the node in nodeCfg func unsubscribeNode(client mqtt.Client, nodeCfg *config.ClientConfig) { client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)) var ok = true if token := client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.Wait() && token.Error() != nil { logger.Log(1, "unable to unsubscribe from updates for node ", nodeCfg.Node.Name, "\n", token.Error().Error()) ok = false } if token := client.Unsubscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.Wait() && token.Error() != nil { logger.Log(1, "unable to unsubscribe from peer updates for node ", nodeCfg.Node.Name, "\n", token.Error().Error()) ok = false } if ok { logger.Log(1, "successfully unsubscribed node ", nodeCfg.Node.ID, " : ", nodeCfg.Node.Name) } } // sets up Message Queue and subsribes/publishes updates to/from server // the client should subscribe to ALL nodes that exist on server func messageQueue(ctx context.Context, wg sync.WaitGroup, cfg *config.ClientConfig) { //var commsCfg config.ClientConfig //commsCfg.Network = commsNet //commsCfg.ReadConfig() logger.Log(0, "netclient daemon started for server: ", cfg.Server.ServerName) client := setupMQTT(cfg, false) defer client.Disconnect(250) <-ctx.Done() logger.Log(0, "shutting down daemon for server ", cfg.Server.ServerName) wg.Done() } // setupMQTT creates a connection to broker and return client // utilizes comms client configs to setup connections func setupMQTT(cfg *config.ClientConfig, publish bool) mqtt.Client { opts := mqtt.NewClientOptions() opts.AddBroker("ssl://" + cfg.Server.ServerName + ":8883") logger.Log(2, "added broker ", cfg.Server.ServerName) opts.SetDefaultPublishHandler(All) opts.SetAutoReconnect(true) opts.SetConnectRetry(true) opts.SetConnectRetryInterval(time.Second << 2) opts.SetKeepAlive(time.Minute >> 1) opts.SetWriteTimeout(time.Minute) opts.SetOnConnectHandler(func(client mqtt.Client) { logger.Log(0, "Connection Handler") if !publish { networks, err := ncutils.GetSystemNetworks() if err != nil { logger.Log(0, "error retriving networks ", err.Error()) } for _, network := range networks { var currNodeCfg config.ClientConfig currNodeCfg.Network = network currNodeCfg.ReadConfig() setSubscriptions(client, &currNodeCfg) } } }) opts.SetOrderMatters(true) opts.SetResumeSubs(true) opts.SetConnectionLostHandler(func(c mqtt.Client, e error) { logger.Log(0, "detected broker connection lost, running pull for ", cfg.Node.Network) _, err := Pull(cfg.Node.Network, true) if err != nil { logger.Log(0, "could not run pull, server unreachable: ", err.Error()) logger.Log(0, "waiting to retry...") } logger.Log(0, "connection re-established with mqtt server") }) opts.SetTLSConfig(NewTLSConfig(cfg)) logger.Log(0, "Calling NewClient") client := mqtt.NewClient(opts) tperiod := time.Now().Add(12 * time.Second) for { //if after 12 seconds, try a gRPC pull on the last try if time.Now().After(tperiod) { logger.Log(0, "running pull for ", cfg.Node.Network) _, err := Pull(cfg.Node.Network, true) if err != nil { logger.Log(0, "could not run pull, exiting ", cfg.Node.Network, " setup: ", err.Error()) return client } time.Sleep(time.Second) } if token := client.Connect(); token.Wait() && token.Error() != nil { logger.Log(0, token.Error().Error()) logger.Log(0, "unable to connect to broker, retrying ...") if time.Now().After(tperiod) { logger.Log(0, "could not connect to broker, exiting ", cfg.Node.Network, " setup: ", token.Error().Error()) if strings.Contains(token.Error().Error(), "connectex") || strings.Contains(token.Error().Error(), "i/o timeout") { logger.Log(0, "connection issue detected.. pulling and restarting daemon") Pull(cfg.Node.Network, true) daemon.Restart() } return client } } else { break } time.Sleep(2 * time.Second) } logger.Log(0, "MQ setup "+cfg.NetworkSettings.NetID) return client } // NewTLSConf sets up tls to connect to broker func NewTLSConfig(cfg *config.ClientConfig) *tls.Config { certpool := x509.NewCertPool() ca, err := ioutil.ReadFile("/etc/netclient/" + cfg.NetworkSettings.NetID + "-ca.pem") if err != nil { log.Fatalf("could not read CA file %v\n", err) } certpool.AppendCertsFromPEM(ca) clientKeyPair, err := tls.LoadX509KeyPair("/etc/netclient/"+cfg.NetworkSettings.NetID+"-client.pem", "/etc/netclient/client.key") if err != nil { log.Fatalf("could not read client cert/key %v \n", err) } return &tls.Config{ RootCAs: certpool, //ClientAuth: tls.NoClientCert, ClientAuth: tls.VerifyClientCertIfGiven, ClientCAs: nil, InsecureSkipVerify: true, Certificates: []tls.Certificate{clientKeyPair}, } } // publishes a message to server to update peers on this peer's behalf func publishSignal(nodeCfg *config.ClientConfig, signal string) error { if err := publish(nodeCfg, fmt.Sprintf("signal/%s", nodeCfg.Node.ID), []byte(signal), 1); err != nil { return err } return nil } func initialPull(network string) { logger.Log(0, "pulling latest config for ", network) var configPath = fmt.Sprintf("%snetconfig-%s", ncutils.GetNetclientPathSpecific(), network) fileInfo, err := os.Stat(configPath) if err != nil { logger.Log(0, "could not stat config file: ", configPath) return } // speed up UDP rest if !fileInfo.ModTime().IsZero() && time.Now().After(fileInfo.ModTime().Add(time.Minute)) { sleepTime := 2 for { _, err := Pull(network, true) if err == nil { break } if sleepTime > 3600 { sleepTime = 3600 } logger.Log(0, "failed to pull for network ", network) logger.Log(0, fmt.Sprintf("waiting %d seconds to retry...", sleepTime)) time.Sleep(time.Second * time.Duration(sleepTime)) sleepTime = sleepTime * 2 } time.Sleep(time.Second << 1) } } func parseNetworkFromTopic(topic string) string { return strings.Split(topic, "/")[1] } // should only ever use node client configs func decryptMsg(nodeCfg *config.ClientConfig, msg []byte) ([]byte, error) { if len(msg) <= 24 { // make sure message is of appropriate length return nil, fmt.Errorf("recieved invalid message from broker %v", msg) } // setup the keys diskKey, keyErr := auth.RetrieveTrafficKey(nodeCfg.Node.Network) if keyErr != nil { return nil, keyErr } serverPubKey, err := ncutils.ConvertBytesToKey(nodeCfg.Node.TrafficKeys.Server) if err != nil { return nil, err } return ncutils.DeChunk(msg, serverPubKey, diskKey) } func getServerAddress(cfg *config.ClientConfig) string { var server models.ServerAddr for _, server = range cfg.Node.NetworkSettings.DefaultServerAddrs { if server.Address != "" && server.IsLeader { break } } return server.Address } func getServers(networks []string) (map[string]bool, error) { var cfg config.ClientConfig var response = make(map[string]bool, 1) for _, network := range networks { cfg.Network = network cfg.ReadConfig() response[cfg.Server.ServerName] = true } return response, nil } func getCommsNetworks(networks []string) (map[string]bool, error) { var cfg config.ClientConfig var response = make(map[string]bool, 1) for _, network := range networks { cfg.Network = network cfg.ReadConfig() response[cfg.Node.CommID] = true } return response, nil } func getCommsCfgByNode(node *models.Node) config.ClientConfig { var commsCfg config.ClientConfig commsCfg.Network = node.CommID commsCfg.ReadConfig() return commsCfg } // == Message Caches == func insert(network, which, cache string) { var newMessage = cachedMessage{ Message: cache, LastSeen: time.Now(), } messageCache.Store(fmt.Sprintf("%s%s", network, which), newMessage) } func read(network, which string) string { val, isok := messageCache.Load(fmt.Sprintf("%s%s", network, which)) if isok { var readMessage = val.(cachedMessage) // fetch current cached message if readMessage.LastSeen.IsZero() { return "" } if time.Now().After(readMessage.LastSeen.Add(time.Minute * 10)) { // check if message has been there over a minute messageCache.Delete(fmt.Sprintf("%s%s", network, which)) // remove old message if expired return "" } return readMessage.Message // return current message if not expired } return "" } // == End Message Caches ==