daemon.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350
  1. package functions
  2. import (
  3. "context"
  4. "errors"
  5. "fmt"
  6. "os"
  7. "os/signal"
  8. "strings"
  9. "sync"
  10. "syscall"
  11. "time"
  12. mqtt "github.com/eclipse/paho.mqtt.golang"
  13. "github.com/gravitl/netmaker/logger"
  14. "github.com/gravitl/netmaker/mq"
  15. "github.com/gravitl/netmaker/netclient/auth"
  16. "github.com/gravitl/netmaker/netclient/config"
  17. "github.com/gravitl/netmaker/netclient/global_settings"
  18. "github.com/gravitl/netmaker/netclient/local"
  19. "github.com/gravitl/netmaker/netclient/ncutils"
  20. "github.com/gravitl/netmaker/netclient/wireguard"
  21. "golang.zx2c4.com/wireguard/wgctrl/wgtypes"
  22. )
  23. var messageCache = new(sync.Map)
  24. var serverSet map[string]bool
  25. var mqclient mqtt.Client
  26. const lastNodeUpdate = "lnu"
  27. const lastPeerUpdate = "lpu"
  28. type cachedMessage struct {
  29. Message string
  30. LastSeen time.Time
  31. }
  32. // Daemon runs netclient daemon from command line
  33. func Daemon() error {
  34. logger.Log(0, "netclient daemon started -- version:", ncutils.Version)
  35. UpdateClientConfig()
  36. if err := ncutils.SavePID(); err != nil {
  37. return err
  38. }
  39. // reference required to eliminate unused statticcheck
  40. serverSet = make(map[string]bool)
  41. serverSet["dummy"] = false
  42. // set ipforwarding on startup
  43. err := local.SetIPForwarding()
  44. if err != nil {
  45. logger.Log(0, err.Error())
  46. }
  47. // == add waitgroup and cancel for checkin routine ==
  48. wg := sync.WaitGroup{}
  49. quit := make(chan os.Signal, 1)
  50. reset := make(chan os.Signal, 1)
  51. signal.Notify(quit, syscall.SIGTERM, os.Interrupt)
  52. signal.Notify(reset, syscall.SIGHUP)
  53. cancel := startGoRoutines(&wg)
  54. for {
  55. select {
  56. case <-quit:
  57. cancel()
  58. logger.Log(0, "shutting down netclient daemon")
  59. wg.Wait()
  60. if mqclient != nil {
  61. mqclient.Disconnect(250)
  62. }
  63. logger.Log(0, "shutdown complete")
  64. return nil
  65. case <-reset:
  66. logger.Log(0, "received reset")
  67. cancel()
  68. wg.Wait()
  69. if mqclient != nil {
  70. mqclient.Disconnect(250)
  71. }
  72. logger.Log(0, "restarting daemon")
  73. cancel = startGoRoutines(&wg)
  74. }
  75. }
  76. }
  77. func startGoRoutines(wg *sync.WaitGroup) context.CancelFunc {
  78. ctx, cancel := context.WithCancel(context.Background())
  79. serverSet := make(map[string]bool)
  80. networks, _ := ncutils.GetSystemNetworks()
  81. for _, network := range networks {
  82. logger.Log(3, "initializing network", network)
  83. cfg := config.ClientConfig{}
  84. cfg.Network = network
  85. cfg.ReadConfig()
  86. if cfg.Node.Connected == "yes" {
  87. if err := wireguard.ApplyConf(&cfg.Node, cfg.Node.Interface, ncutils.GetNetclientPathSpecific()+cfg.Node.Interface+".conf"); err != nil {
  88. logger.Log(0, "failed to start ", cfg.Node.Interface, "wg interface", err.Error())
  89. }
  90. if cfg.PublicIPService != "" {
  91. global_settings.PublicIPServices[network] = cfg.PublicIPService
  92. }
  93. }
  94. server := cfg.Server.Server
  95. if !serverSet[server] {
  96. // == subscribe to all nodes for each on machine ==
  97. serverSet[server] = true
  98. logger.Log(1, "started daemon for server ", server)
  99. local.SetNetmakerDomainRoute(cfg.Server.API)
  100. wg.Add(1)
  101. go messageQueue(ctx, wg, &cfg)
  102. }
  103. }
  104. wg.Add(1)
  105. go Checkin(ctx, wg)
  106. return cancel
  107. }
  108. // UpdateKeys -- updates private key and returns new publickey
  109. func UpdateKeys(nodeCfg *config.ClientConfig, client mqtt.Client) error {
  110. logger.Log(0, "interface:", nodeCfg.Node.Interface, "received message to update wireguard keys for network ", nodeCfg.Network)
  111. key, err := wgtypes.GeneratePrivateKey()
  112. if err != nil {
  113. logger.Log(0, "network:", nodeCfg.Node.Network, "error generating privatekey ", err.Error())
  114. return err
  115. }
  116. file := ncutils.GetNetclientPathSpecific() + nodeCfg.Node.Interface + ".conf"
  117. if err := wireguard.UpdatePrivateKey(file, key.String()); err != nil {
  118. logger.Log(0, "network:", nodeCfg.Node.Network, "error updating wireguard key ", err.Error())
  119. return err
  120. }
  121. if storeErr := wireguard.StorePrivKey(key.String(), nodeCfg.Network); storeErr != nil {
  122. logger.Log(0, "network:", nodeCfg.Network, "failed to save private key", storeErr.Error())
  123. return storeErr
  124. }
  125. nodeCfg.Node.PublicKey = key.PublicKey().String()
  126. PublishNodeUpdate(nodeCfg)
  127. return nil
  128. }
  129. // == Private ==
  130. // sets MQ client subscriptions for a specific node config
  131. // should be called for each node belonging to a given server
  132. func setSubscriptions(client mqtt.Client, nodeCfg *config.ClientConfig) {
  133. if token := client.Subscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(NodeUpdate)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  134. if token.Error() == nil {
  135. logger.Log(0, "network:", nodeCfg.Node.Network, "connection timeout")
  136. } else {
  137. logger.Log(0, "network:", nodeCfg.Node.Network, token.Error().Error())
  138. }
  139. return
  140. }
  141. logger.Log(3, fmt.Sprintf("subscribed to node updates for node %s update/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID))
  142. if token := client.Subscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(UpdatePeers)); token.Wait() && token.Error() != nil {
  143. logger.Log(0, "network", nodeCfg.Node.Network, token.Error().Error())
  144. return
  145. }
  146. logger.Log(3, fmt.Sprintf("subscribed to peer updates for node %s peers/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID))
  147. }
  148. // on a delete usually, pass in the nodecfg to unsubscribe client broker communications
  149. // for the node in nodeCfg
  150. func unsubscribeNode(client mqtt.Client, nodeCfg *config.ClientConfig) {
  151. client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID))
  152. var ok = true
  153. if token := client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  154. if token.Error() == nil {
  155. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from updates for node ", nodeCfg.Node.Name, "\n", "connection timeout")
  156. } else {
  157. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from updates for node ", nodeCfg.Node.Name, "\n", token.Error().Error())
  158. }
  159. ok = false
  160. }
  161. if token := client.Unsubscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  162. if token.Error() == nil {
  163. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from peer updates for node", nodeCfg.Node.Name, "\n", "connection timeout")
  164. } else {
  165. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from peer updates for node", nodeCfg.Node.Name, "\n", token.Error().Error())
  166. }
  167. ok = false
  168. }
  169. if ok {
  170. logger.Log(1, "network:", nodeCfg.Node.Network, "successfully unsubscribed node ", nodeCfg.Node.ID, " : ", nodeCfg.Node.Name)
  171. }
  172. }
  173. // sets up Message Queue and subsribes/publishes updates to/from server
  174. // the client should subscribe to ALL nodes that exist on server locally
  175. func messageQueue(ctx context.Context, wg *sync.WaitGroup, cfg *config.ClientConfig) {
  176. defer wg.Done()
  177. logger.Log(0, "network:", cfg.Node.Network, "netclient message queue started for server:", cfg.Server.Server)
  178. err := setupMQTT(cfg)
  179. if err != nil {
  180. logger.Log(0, "unable to connect to broker", cfg.Server.Server, err.Error())
  181. return
  182. }
  183. //defer mqclient.Disconnect(250)
  184. <-ctx.Done()
  185. logger.Log(0, "shutting down message queue for server", cfg.Server.Server)
  186. }
  187. // func setMQTTSingenton creates a connection to broker for single use (ie to publish a message)
  188. // only to be called from cli (eg. connect/disconnect, join, leave) and not from daemon ---
  189. func setupMQTTSingleton(cfg *config.ClientConfig) error {
  190. opts := mqtt.NewClientOptions()
  191. server := cfg.Server.Server
  192. port := cfg.Server.MQPort
  193. pass, err := os.ReadFile(ncutils.GetNetclientPathSpecific() + "secret-" + cfg.Network)
  194. if err != nil {
  195. return fmt.Errorf("could not read secrets file %w", err)
  196. }
  197. opts.AddBroker("mqtts://" + server + ":" + port)
  198. opts.SetUsername(cfg.Node.ID)
  199. opts.SetPassword(string(pass))
  200. mqclient = mqtt.NewClient(opts)
  201. var connecterr error
  202. opts.SetClientID(ncutils.MakeRandomString(23))
  203. if token := mqclient.Connect(); !token.WaitTimeout(30*time.Second) || token.Error() != nil {
  204. logger.Log(0, "unable to connect to broker, retrying ...")
  205. if token.Error() == nil {
  206. connecterr = errors.New("connect timeout")
  207. } else {
  208. connecterr = token.Error()
  209. }
  210. }
  211. return connecterr
  212. }
  213. // setupMQTT creates a connection to broker and returns client
  214. // this function is primarily used to create a connection to publish to the broker
  215. func setupMQTT(cfg *config.ClientConfig) error {
  216. opts := mqtt.NewClientOptions()
  217. server := cfg.Server.Server
  218. port := cfg.Server.MQPort
  219. pass, err := os.ReadFile(ncutils.GetNetclientPathSpecific() + "secret-" + cfg.Network)
  220. if err != nil {
  221. return fmt.Errorf("could not read secrets file %w", err)
  222. }
  223. opts.AddBroker(fmt.Sprintf("mqtts://%s:%s", server, port))
  224. opts.SetUsername(cfg.Node.ID)
  225. opts.SetPassword(string(pass))
  226. opts.SetClientID(ncutils.MakeRandomString(23))
  227. opts.SetDefaultPublishHandler(All)
  228. opts.SetAutoReconnect(true)
  229. opts.SetConnectRetry(true)
  230. opts.SetConnectRetryInterval(time.Second << 2)
  231. opts.SetKeepAlive(time.Minute >> 1)
  232. opts.SetWriteTimeout(time.Minute)
  233. opts.SetOnConnectHandler(func(client mqtt.Client) {
  234. networks, err := ncutils.GetSystemNetworks()
  235. if err != nil {
  236. logger.Log(0, "error retriving networks", err.Error())
  237. }
  238. for _, network := range networks {
  239. var currNodeCfg config.ClientConfig
  240. currNodeCfg.Network = network
  241. currNodeCfg.ReadConfig()
  242. setSubscriptions(client, &currNodeCfg)
  243. }
  244. })
  245. opts.SetOrderMatters(true)
  246. opts.SetResumeSubs(true)
  247. opts.SetConnectionLostHandler(func(c mqtt.Client, e error) {
  248. logger.Log(0, "network:", cfg.Node.Network, "detected broker connection lost for", cfg.Server.Server)
  249. })
  250. mqclient = mqtt.NewClient(opts)
  251. var connecterr error
  252. for count := 0; count < 3; count++ {
  253. connecterr = nil
  254. if token := mqclient.Connect(); !token.WaitTimeout(30*time.Second) || token.Error() != nil {
  255. logger.Log(0, "unable to connect to broker, retrying ...")
  256. if token.Error() == nil {
  257. connecterr = errors.New("connect timeout")
  258. } else {
  259. connecterr = token.Error()
  260. }
  261. if err := checkBroker(cfg.Server.Server, cfg.Server.MQPort); err != nil {
  262. logger.Log(0, "could not connect to broker", cfg.Server.Server, err.Error())
  263. }
  264. }
  265. }
  266. if connecterr != nil {
  267. logger.Log(0, "failed to establish connection to broker: ", connecterr.Error())
  268. return connecterr
  269. }
  270. return nil
  271. }
  272. // publishes a message to server to update peers on this peer's behalf
  273. func publishSignal(nodeCfg *config.ClientConfig, signal byte) error {
  274. if err := publish(nodeCfg, fmt.Sprintf("signal/%s", nodeCfg.Node.ID), []byte{signal}, 1); err != nil {
  275. return err
  276. }
  277. return nil
  278. }
  // parseNetworkFromTopic returns the second "/"-separated segment of an MQ
  // topic, e.g. "mynet" for "update/mynet/<nodeID>". It returns the empty
  // string when the topic contains no "/" instead of panicking on the index.
  func parseNetworkFromTopic(topic string) string {
  	// only the first two segments matter; the remainder is left unsplit
  	segments := strings.SplitN(topic, "/", 3)
  	if len(segments) < 2 {
  		return ""
  	}
  	return segments[1]
  }
  282. // should only ever use node client configs
  283. func decryptMsg(nodeCfg *config.ClientConfig, msg []byte) ([]byte, error) {
  284. if len(msg) <= 24 { // make sure message is of appropriate length
  285. return nil, fmt.Errorf("recieved invalid message from broker %v", msg)
  286. }
  287. // setup the keys
  288. diskKey, keyErr := auth.RetrieveTrafficKey(nodeCfg.Node.Network)
  289. if keyErr != nil {
  290. return nil, keyErr
  291. }
  292. serverPubKey, err := ncutils.ConvertBytesToKey(nodeCfg.Node.TrafficKeys.Server)
  293. if err != nil {
  294. return nil, err
  295. }
  296. return ncutils.DeChunk(msg, serverPubKey, diskKey)
  297. }
  298. // == Message Caches ==
  299. func insert(network, which, cache string) {
  300. var newMessage = cachedMessage{
  301. Message: cache,
  302. LastSeen: time.Now(),
  303. }
  304. messageCache.Store(fmt.Sprintf("%s%s", network, which), newMessage)
  305. }
  306. func read(network, which string) string {
  307. val, isok := messageCache.Load(fmt.Sprintf("%s%s", network, which))
  308. if isok {
  309. var readMessage = val.(cachedMessage) // fetch current cached message
  310. if readMessage.LastSeen.IsZero() {
  311. return ""
  312. }
  313. if time.Now().After(readMessage.LastSeen.Add(time.Hour * 24)) { // check if message has been there over a minute
  314. messageCache.Delete(fmt.Sprintf("%s%s", network, which)) // remove old message if expired
  315. return ""
  316. }
  317. return readMessage.Message // return current message if not expired
  318. }
  319. return ""
  320. }