daemon.go 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374
  1. package functions
  2. import (
  3. "context"
  4. "crypto/tls"
  5. "crypto/x509"
  6. "errors"
  7. "fmt"
  8. "os"
  9. "os/signal"
  10. "strings"
  11. "sync"
  12. "syscall"
  13. "time"
  14. mqtt "github.com/eclipse/paho.mqtt.golang"
  15. "github.com/gravitl/netmaker/logger"
  16. "github.com/gravitl/netmaker/mq"
  17. "github.com/gravitl/netmaker/netclient/auth"
  18. "github.com/gravitl/netmaker/netclient/config"
  19. "github.com/gravitl/netmaker/netclient/global_settings"
  20. "github.com/gravitl/netmaker/netclient/local"
  21. "github.com/gravitl/netmaker/netclient/ncutils"
  22. "github.com/gravitl/netmaker/netclient/wireguard"
  23. "golang.zx2c4.com/wireguard/wgctrl/wgtypes"
  24. )
  25. var messageCache = new(sync.Map)
  26. var serverSet map[string]bool
  27. var mqclient mqtt.Client
  28. const lastNodeUpdate = "lnu"
  29. const lastPeerUpdate = "lpu"
  30. type cachedMessage struct {
  31. Message string
  32. LastSeen time.Time
  33. }
  34. // Daemon runs netclient daemon from command line
  35. func Daemon() error {
  36. logger.Log(0, "netclient daemon started -- version:", ncutils.Version)
  37. UpdateClientConfig()
  38. if err := ncutils.SavePID(); err != nil {
  39. return err
  40. }
  41. // reference required to eliminate unused statticcheck
  42. serverSet = make(map[string]bool)
  43. serverSet["dummy"] = false
  44. // set ipforwarding on startup
  45. err := local.SetIPForwarding()
  46. if err != nil {
  47. logger.Log(0, err.Error())
  48. }
  49. // == add waitgroup and cancel for checkin routine ==
  50. wg := sync.WaitGroup{}
  51. quit := make(chan os.Signal, 1)
  52. reset := make(chan os.Signal, 1)
  53. signal.Notify(quit, syscall.SIGTERM, os.Interrupt)
  54. signal.Notify(reset, syscall.SIGHUP)
  55. cancel := startGoRoutines(&wg)
  56. for {
  57. select {
  58. case <-quit:
  59. cancel()
  60. logger.Log(0, "shutting down netclient daemon")
  61. wg.Wait()
  62. logger.Log(0, "shutdown complete")
  63. return nil
  64. case <-reset:
  65. logger.Log(0, "received reset")
  66. cancel()
  67. wg.Wait()
  68. logger.Log(0, "restarting daemon")
  69. cancel = startGoRoutines(&wg)
  70. }
  71. }
  72. }
  73. func startGoRoutines(wg *sync.WaitGroup) context.CancelFunc {
  74. ctx, cancel := context.WithCancel(context.Background())
  75. serverSet := make(map[string]bool)
  76. networks, _ := ncutils.GetSystemNetworks()
  77. for _, network := range networks {
  78. logger.Log(3, "initializing network", network)
  79. cfg := config.ClientConfig{}
  80. cfg.Network = network
  81. cfg.ReadConfig()
  82. if cfg.Node.Connected == "yes" {
  83. if err := wireguard.ApplyConf(&cfg.Node, cfg.Node.Interface, ncutils.GetNetclientPathSpecific()+cfg.Node.Interface+".conf"); err != nil {
  84. logger.Log(0, "failed to start ", cfg.Node.Interface, "wg interface", err.Error())
  85. }
  86. if cfg.PublicIPService != "" {
  87. global_settings.PublicIPServices[network] = cfg.PublicIPService
  88. }
  89. }
  90. server := cfg.Server.Server
  91. if !serverSet[server] {
  92. // == subscribe to all nodes for each on machine ==
  93. serverSet[server] = true
  94. logger.Log(1, "started daemon for server ", server)
  95. local.SetNetmakerDomainRoute(cfg.Server.API)
  96. wg.Add(1)
  97. go messageQueue(ctx, wg, &cfg)
  98. }
  99. }
  100. wg.Add(1)
  101. go Checkin(ctx, wg)
  102. return cancel
  103. }
  104. // UpdateKeys -- updates private key and returns new publickey
  105. func UpdateKeys(nodeCfg *config.ClientConfig, client mqtt.Client) error {
  106. logger.Log(0, "interface:", nodeCfg.Node.Interface, "received message to update wireguard keys for network ", nodeCfg.Network)
  107. key, err := wgtypes.GeneratePrivateKey()
  108. if err != nil {
  109. logger.Log(0, "network:", nodeCfg.Node.Network, "error generating privatekey ", err.Error())
  110. return err
  111. }
  112. file := ncutils.GetNetclientPathSpecific() + nodeCfg.Node.Interface + ".conf"
  113. if err := wireguard.UpdatePrivateKey(file, key.String()); err != nil {
  114. logger.Log(0, "network:", nodeCfg.Node.Network, "error updating wireguard key ", err.Error())
  115. return err
  116. }
  117. if storeErr := wireguard.StorePrivKey(key.String(), nodeCfg.Network); storeErr != nil {
  118. logger.Log(0, "network:", nodeCfg.Network, "failed to save private key", storeErr.Error())
  119. return storeErr
  120. }
  121. nodeCfg.Node.PublicKey = key.PublicKey().String()
  122. PublishNodeUpdate(nodeCfg)
  123. return nil
  124. }
  125. // == Private ==
  126. // sets MQ client subscriptions for a specific node config
  127. // should be called for each node belonging to a given server
  128. func setSubscriptions(client mqtt.Client, nodeCfg *config.ClientConfig) {
  129. if token := client.Subscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(NodeUpdate)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  130. if token.Error() == nil {
  131. logger.Log(0, "network:", nodeCfg.Node.Network, "connection timeout")
  132. } else {
  133. logger.Log(0, "network:", nodeCfg.Node.Network, token.Error().Error())
  134. }
  135. return
  136. }
  137. logger.Log(3, fmt.Sprintf("subscribed to node updates for node %s update/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID))
  138. if token := client.Subscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID), 0, mqtt.MessageHandler(UpdatePeers)); token.Wait() && token.Error() != nil {
  139. logger.Log(0, "network", nodeCfg.Node.Network, token.Error().Error())
  140. return
  141. }
  142. logger.Log(3, fmt.Sprintf("subscribed to peer updates for node %s peers/%s/%s", nodeCfg.Node.Name, nodeCfg.Node.Network, nodeCfg.Node.ID))
  143. }
  144. // on a delete usually, pass in the nodecfg to unsubscribe client broker communications
  145. // for the node in nodeCfg
  146. func unsubscribeNode(client mqtt.Client, nodeCfg *config.ClientConfig) {
  147. client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID))
  148. var ok = true
  149. if token := client.Unsubscribe(fmt.Sprintf("update/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  150. if token.Error() == nil {
  151. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from updates for node ", nodeCfg.Node.Name, "\n", "connection timeout")
  152. } else {
  153. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from updates for node ", nodeCfg.Node.Name, "\n", token.Error().Error())
  154. }
  155. ok = false
  156. }
  157. if token := client.Unsubscribe(fmt.Sprintf("peers/%s/%s", nodeCfg.Node.Network, nodeCfg.Node.ID)); token.WaitTimeout(mq.MQ_TIMEOUT*time.Second) && token.Error() != nil {
  158. if token.Error() == nil {
  159. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from peer updates for node", nodeCfg.Node.Name, "\n", "connection timeout")
  160. } else {
  161. logger.Log(1, "network:", nodeCfg.Node.Network, "unable to unsubscribe from peer updates for node", nodeCfg.Node.Name, "\n", token.Error().Error())
  162. }
  163. ok = false
  164. }
  165. if ok {
  166. logger.Log(1, "network:", nodeCfg.Node.Network, "successfully unsubscribed node ", nodeCfg.Node.ID, " : ", nodeCfg.Node.Name)
  167. }
  168. }
  169. // sets up Message Queue and subsribes/publishes updates to/from server
  170. // the client should subscribe to ALL nodes that exist on server locally
  171. func messageQueue(ctx context.Context, wg *sync.WaitGroup, cfg *config.ClientConfig) {
  172. defer wg.Done()
  173. logger.Log(0, "network:", cfg.Node.Network, "netclient message queue started for server:", cfg.Server.Server)
  174. err := setupMQTT(cfg)
  175. if err != nil {
  176. logger.Log(0, "unable to connect to broker", cfg.Server.Server, err.Error())
  177. return
  178. }
  179. //defer mqclient.Disconnect(250)
  180. <-ctx.Done()
  181. logger.Log(0, "shutting down message queue for server", cfg.Server.Server)
  182. }
  183. // NewTLSConf sets up tls configuration to connect to broker securely
  184. func NewTLSConfig(server string) (*tls.Config, error) {
  185. file := ncutils.GetNetclientServerPath(server) + ncutils.GetSeparator() + "root.pem"
  186. certpool := x509.NewCertPool()
  187. ca, err := os.ReadFile(file)
  188. if err != nil {
  189. logger.Log(0, "could not read CA file", err.Error())
  190. }
  191. ok := certpool.AppendCertsFromPEM(ca)
  192. if !ok {
  193. logger.Log(0, "failed to append cert")
  194. }
  195. clientKeyPair, err := tls.LoadX509KeyPair(ncutils.GetNetclientServerPath(server)+ncutils.GetSeparator()+"client.pem", ncutils.GetNetclientPath()+ncutils.GetSeparator()+"client.key")
  196. if err != nil {
  197. logger.Log(0, "could not read client cert/key", err.Error())
  198. return nil, err
  199. }
  200. certs := []tls.Certificate{clientKeyPair}
  201. return &tls.Config{
  202. RootCAs: certpool,
  203. ClientAuth: tls.NoClientCert,
  204. ClientCAs: nil,
  205. Certificates: certs,
  206. InsecureSkipVerify: false,
  207. }, nil
  208. }
  209. // func setMQTTSingenton creates a connection to broker for single use (ie to publish a message)
  210. // only to be called from cli (eg. connect/disconnect, join, leave) and not from daemon ---
  211. func setupMQTTSingleton(cfg *config.ClientConfig) error {
  212. opts := mqtt.NewClientOptions()
  213. server := cfg.Server.Server
  214. port := cfg.Server.MQPort
  215. pass, err := os.ReadFile(ncutils.GetNetclientPathSpecific() + "secret-" + cfg.Network)
  216. if err != nil {
  217. return fmt.Errorf("could not read secrets file %w", err)
  218. }
  219. opts.AddBroker("mqtts://" + server + ":" + port)
  220. opts.SetUsername(cfg.Node.ID)
  221. opts.SetPassword(string(pass))
  222. mqclient := mqtt.NewClient(opts)
  223. var connecterr error
  224. opts.SetClientID(ncutils.MakeRandomString(23))
  225. if token := mqclient.Connect(); !token.WaitTimeout(30*time.Second) || token.Error() != nil {
  226. logger.Log(0, "unable to connect to broker, retrying ...")
  227. if token.Error() == nil {
  228. connecterr = errors.New("connect timeout")
  229. } else {
  230. connecterr = token.Error()
  231. }
  232. }
  233. return connecterr
  234. }
  235. // setupMQTT creates a connection to broker and returns client
  236. // this function is primarily used to create a connection to publish to the broker
  237. func setupMQTT(cfg *config.ClientConfig) error {
  238. opts := mqtt.NewClientOptions()
  239. server := cfg.Server.Server
  240. port := cfg.Server.MQPort
  241. pass, err := os.ReadFile(ncutils.GetNetclientPathSpecific() + "secret-" + cfg.Network)
  242. if err != nil {
  243. return fmt.Errorf("could not read secrets file %w", err)
  244. }
  245. opts.AddBroker(fmt.Sprintf("mqtts://%s:%s", server, port))
  246. opts.SetUsername(cfg.Node.ID)
  247. opts.SetPassword(string(pass))
  248. opts.SetClientID(ncutils.MakeRandomString(23))
  249. opts.SetDefaultPublishHandler(All)
  250. opts.SetAutoReconnect(true)
  251. opts.SetConnectRetry(true)
  252. opts.SetConnectRetryInterval(time.Second << 2)
  253. opts.SetKeepAlive(time.Minute >> 1)
  254. opts.SetWriteTimeout(time.Minute)
  255. opts.SetOnConnectHandler(func(client mqtt.Client) {
  256. networks, err := ncutils.GetSystemNetworks()
  257. if err != nil {
  258. logger.Log(0, "error retriving networks", err.Error())
  259. }
  260. for _, network := range networks {
  261. var currNodeCfg config.ClientConfig
  262. currNodeCfg.Network = network
  263. currNodeCfg.ReadConfig()
  264. setSubscriptions(client, &currNodeCfg)
  265. }
  266. })
  267. opts.SetOrderMatters(true)
  268. opts.SetResumeSubs(true)
  269. opts.SetConnectionLostHandler(func(c mqtt.Client, e error) {
  270. logger.Log(0, "network:", cfg.Node.Network, "detected broker connection lost for", cfg.Server.Server)
  271. })
  272. mqclient = mqtt.NewClient(opts)
  273. var connecterr error
  274. for count := 0; count < 3; count++ {
  275. connecterr = nil
  276. if token := mqclient.Connect(); !token.WaitTimeout(30*time.Second) || token.Error() != nil {
  277. logger.Log(0, "unable to connect to broker, retrying ...")
  278. if token.Error() == nil {
  279. connecterr = errors.New("connect timeout")
  280. } else {
  281. connecterr = token.Error()
  282. }
  283. if err := checkBroker(cfg.Server.Server, cfg.Server.MQPort); err != nil {
  284. logger.Log(0, "could not connect to broker", cfg.Server.Server, err.Error())
  285. }
  286. }
  287. }
  288. if connecterr != nil {
  289. logger.Log(0, "failed to establish connection to broker: ", connecterr.Error())
  290. return connecterr
  291. }
  292. return nil
  293. }
  294. // publishes a message to server to update peers on this peer's behalf
  295. func publishSignal(nodeCfg *config.ClientConfig, signal byte) error {
  296. if err := publish(nodeCfg, fmt.Sprintf("signal/%s", nodeCfg.Node.ID), []byte{signal}, 1); err != nil {
  297. return err
  298. }
  299. return nil
  300. }
  // parseNetworkFromTopic returns the second "/"-separated segment of topic,
  // which is the network name in topics shaped like "update/<network>/<id>".
  // It returns "" when topic contains no "/" instead of panicking on a
  // malformed topic.
  func parseNetworkFromTopic(topic string) string {
  	parts := strings.Split(topic, "/")
  	if len(parts) < 2 {
  		return ""
  	}
  	return parts[1]
  }
  304. // should only ever use node client configs
  305. func decryptMsg(nodeCfg *config.ClientConfig, msg []byte) ([]byte, error) {
  306. if len(msg) <= 24 { // make sure message is of appropriate length
  307. return nil, fmt.Errorf("recieved invalid message from broker %v", msg)
  308. }
  309. // setup the keys
  310. diskKey, keyErr := auth.RetrieveTrafficKey(nodeCfg.Node.Network)
  311. if keyErr != nil {
  312. return nil, keyErr
  313. }
  314. serverPubKey, err := ncutils.ConvertBytesToKey(nodeCfg.Node.TrafficKeys.Server)
  315. if err != nil {
  316. return nil, err
  317. }
  318. return ncutils.DeChunk(msg, serverPubKey, diskKey)
  319. }
  320. // == Message Caches ==
  321. func insert(network, which, cache string) {
  322. var newMessage = cachedMessage{
  323. Message: cache,
  324. LastSeen: time.Now(),
  325. }
  326. messageCache.Store(fmt.Sprintf("%s%s", network, which), newMessage)
  327. }
  328. func read(network, which string) string {
  329. val, isok := messageCache.Load(fmt.Sprintf("%s%s", network, which))
  330. if isok {
  331. var readMessage = val.(cachedMessage) // fetch current cached message
  332. if readMessage.LastSeen.IsZero() {
  333. return ""
  334. }
  335. if time.Now().After(readMessage.LastSeen.Add(time.Hour * 24)) { // check if message has been there over a minute
  336. messageCache.Delete(fmt.Sprintf("%s%s", network, which)) // remove old message if expired
  337. return ""
  338. }
  339. return readMessage.Message // return current message if not expired
  340. }
  341. return ""
  342. }