interface.go 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "io"
  6. "os"
  7. "runtime"
  8. "sync/atomic"
  9. "time"
  10. "github.com/rcrowley/go-metrics"
  11. "github.com/sirupsen/logrus"
  12. "github.com/slackhq/nebula/cert"
  13. "github.com/slackhq/nebula/config"
  14. "github.com/slackhq/nebula/firewall"
  15. "github.com/slackhq/nebula/iputil"
  16. "github.com/slackhq/nebula/overlay"
  17. "github.com/slackhq/nebula/udp"
  18. )
  // mtu is the size, in bytes, of the packet and output buffers that listenIn
  // allocates for each tun reader.
  19. const mtu = 9001
  20. type InterfaceConfig struct {
  21. HostMap *HostMap
  22. Outside *udp.Conn
  23. Inside overlay.Device
  24. certState *CertState
  25. Cipher string
  26. Firewall *Firewall
  27. ServeDns bool
  28. HandshakeManager *HandshakeManager
  29. lightHouse *LightHouse
  30. checkInterval int
  31. pendingDeletionInterval int
  32. DropLocalBroadcast bool
  33. DropMulticast bool
  34. routines int
  35. MessageMetrics *MessageMetrics
  36. version string
  37. caPool *cert.NebulaCAPool
  38. disconnectInvalid bool
  39. ConntrackCacheTimeout time.Duration
  40. l *logrus.Logger
  41. }
  42. type Interface struct {
  43. hostMap *HostMap
  44. outside *udp.Conn
  45. inside overlay.Device
  46. certState *CertState
  47. cipher string
  48. firewall *Firewall
  49. connectionManager *connectionManager
  50. handshakeManager *HandshakeManager
  51. serveDns bool
  52. createTime time.Time
  53. lightHouse *LightHouse
  54. localBroadcast iputil.VpnIp
  55. myVpnIp iputil.VpnIp
  56. dropLocalBroadcast bool
  57. dropMulticast bool
  58. routines int
  59. caPool *cert.NebulaCAPool
  60. disconnectInvalid bool
  61. closed int32
  62. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  63. rebindCount int8
  64. version string
  65. conntrackCacheTimeout time.Duration
  66. writers []*udp.Conn
  67. readers []io.ReadWriteCloser
  68. metricHandshakes metrics.Histogram
  69. messageMetrics *MessageMetrics
  70. cachedPacketMetrics *cachedPacketMetrics
  71. l *logrus.Logger
  72. }
  73. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  74. if c.Outside == nil {
  75. return nil, errors.New("no outside connection")
  76. }
  77. if c.Inside == nil {
  78. return nil, errors.New("no inside interface (tun)")
  79. }
  80. if c.certState == nil {
  81. return nil, errors.New("no certificate state")
  82. }
  83. if c.Firewall == nil {
  84. return nil, errors.New("no firewall rules")
  85. }
  86. myVpnIp := iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].IP)
  87. ifce := &Interface{
  88. hostMap: c.HostMap,
  89. outside: c.Outside,
  90. inside: c.Inside,
  91. certState: c.certState,
  92. cipher: c.Cipher,
  93. firewall: c.Firewall,
  94. serveDns: c.ServeDns,
  95. handshakeManager: c.HandshakeManager,
  96. createTime: time.Now(),
  97. lightHouse: c.lightHouse,
  98. localBroadcast: myVpnIp | ^iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].Mask),
  99. dropLocalBroadcast: c.DropLocalBroadcast,
  100. dropMulticast: c.DropMulticast,
  101. routines: c.routines,
  102. version: c.version,
  103. writers: make([]*udp.Conn, c.routines),
  104. readers: make([]io.ReadWriteCloser, c.routines),
  105. caPool: c.caPool,
  106. disconnectInvalid: c.disconnectInvalid,
  107. myVpnIp: myVpnIp,
  108. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  109. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  110. messageMetrics: c.MessageMetrics,
  111. cachedPacketMetrics: &cachedPacketMetrics{
  112. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  113. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  114. },
  115. l: c.l,
  116. }
  117. ifce.connectionManager = newConnectionManager(ctx, c.l, ifce, c.checkInterval, c.pendingDeletionInterval)
  118. return ifce, nil
  119. }
  120. // activate creates the interface on the host. After the interface is created, any
  121. // other services that want to bind listeners to its IP may do so successfully. However,
  122. // the interface isn't going to process anything until run() is called.
  123. func (f *Interface) activate() {
  124. // actually turn on tun dev
  125. addr, err := f.outside.LocalAddr()
  126. if err != nil {
  127. f.l.WithError(err).Error("Failed to get udp listen address")
  128. }
  129. f.l.WithField("interface", f.inside.Name()).WithField("network", f.inside.Cidr().String()).
  130. WithField("build", f.version).WithField("udpAddr", addr).
  131. Info("Nebula interface is active")
  132. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  133. // Prepare n tun queues
  134. var reader io.ReadWriteCloser = f.inside
  135. for i := 0; i < f.routines; i++ {
  136. if i > 0 {
  137. reader, err = f.inside.NewMultiQueueReader()
  138. if err != nil {
  139. f.l.Fatal(err)
  140. }
  141. }
  142. f.readers[i] = reader
  143. }
  144. if err := f.inside.Activate(); err != nil {
  145. f.inside.Close()
  146. f.l.Fatal(err)
  147. }
  148. }
  149. func (f *Interface) run() {
  150. // Launch n queues to read packets from udp
  151. for i := 0; i < f.routines; i++ {
  152. go f.listenOut(i)
  153. }
  154. // Launch n queues to read packets from tun dev
  155. for i := 0; i < f.routines; i++ {
  156. go f.listenIn(f.readers[i], i)
  157. }
  158. }
  159. func (f *Interface) listenOut(i int) {
  160. runtime.LockOSThread()
  161. var li *udp.Conn
  162. // TODO clean this up with a coherent interface for each outside connection
  163. if i > 0 {
  164. li = f.writers[i]
  165. } else {
  166. li = f.outside
  167. }
  168. lhh := f.lightHouse.NewRequestHandler()
  169. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  170. li.ListenOut(f.readOutsidePackets, lhh.HandleRequest, conntrackCache, i)
  171. }
  172. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  173. runtime.LockOSThread()
  174. packet := make([]byte, mtu)
  175. out := make([]byte, mtu)
  176. fwPacket := &firewall.Packet{}
  177. nb := make([]byte, 12, 12)
  178. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  179. for {
  180. n, err := reader.Read(packet)
  181. if err != nil {
  182. if errors.Is(err, os.ErrClosed) && atomic.LoadInt32(&f.closed) != 0 {
  183. return
  184. }
  185. f.l.WithError(err).Error("Error while reading outbound packet")
  186. // This only seems to happen when something fatal happens to the fd, so exit.
  187. os.Exit(2)
  188. }
  189. f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get(f.l))
  190. }
  191. }
  192. func (f *Interface) RegisterConfigChangeCallbacks(c *config.C) {
  193. c.RegisterReloadCallback(f.reloadCA)
  194. c.RegisterReloadCallback(f.reloadCertKey)
  195. c.RegisterReloadCallback(f.reloadFirewall)
  196. for _, udpConn := range f.writers {
  197. c.RegisterReloadCallback(udpConn.ReloadConfig)
  198. }
  199. }
  200. func (f *Interface) reloadCA(c *config.C) {
  201. // reload and check regardless
  202. // todo: need mutex?
  203. newCAs, err := loadCAFromConfig(f.l, c)
  204. if err != nil {
  205. f.l.WithError(err).Error("Could not refresh trusted CA certificates")
  206. return
  207. }
  208. f.caPool = newCAs
  209. f.l.WithField("fingerprints", f.caPool.GetFingerprints()).Info("Trusted CA certificates refreshed")
  210. }
  211. func (f *Interface) reloadCertKey(c *config.C) {
  212. // reload and check in all cases
  213. cs, err := NewCertStateFromConfig(c)
  214. if err != nil {
  215. f.l.WithError(err).Error("Could not refresh client cert")
  216. return
  217. }
  218. // did IP in cert change? if so, don't set
  219. oldIPs := f.certState.certificate.Details.Ips
  220. newIPs := cs.certificate.Details.Ips
  221. if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {
  222. f.l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")
  223. return
  224. }
  225. f.certState = cs
  226. f.l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")
  227. }
  228. func (f *Interface) reloadFirewall(c *config.C) {
  229. //TODO: need to trigger/detect if the certificate changed too
  230. if c.HasChanged("firewall") == false {
  231. f.l.Debug("No firewall config change detected")
  232. return
  233. }
  234. fw, err := NewFirewallFromConfig(f.l, f.certState.certificate, c)
  235. if err != nil {
  236. f.l.WithError(err).Error("Error while creating firewall during reload")
  237. return
  238. }
  239. oldFw := f.firewall
  240. conntrack := oldFw.Conntrack
  241. conntrack.Lock()
  242. defer conntrack.Unlock()
  243. fw.rulesVersion = oldFw.rulesVersion + 1
  244. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  245. // safe and just reset conntrack in this case.
  246. if fw.rulesVersion == 0 {
  247. f.l.WithField("firewallHash", fw.GetRuleHash()).
  248. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  249. WithField("rulesVersion", fw.rulesVersion).
  250. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  251. } else {
  252. fw.Conntrack = conntrack
  253. }
  254. f.firewall = fw
  255. oldFw.Destroy()
  256. f.l.WithField("firewallHash", fw.GetRuleHash()).
  257. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  258. WithField("rulesVersion", fw.rulesVersion).
  259. Info("New firewall has been installed")
  260. }
  261. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  262. ticker := time.NewTicker(i)
  263. defer ticker.Stop()
  264. udpStats := udp.NewUDPStatsEmitter(f.writers)
  265. for {
  266. select {
  267. case <-ctx.Done():
  268. return
  269. case <-ticker.C:
  270. f.firewall.EmitStats()
  271. f.handshakeManager.EmitStats()
  272. udpStats()
  273. }
  274. }
  275. }
  276. func (f *Interface) Close() error {
  277. atomic.StoreInt32(&f.closed, 1)
  278. // Release the tun device
  279. return f.inside.Close()
  280. }