interface.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "net/netip"
  8. "runtime"
  9. "sync"
  10. "sync/atomic"
  11. "time"
  12. "github.com/gaissmai/bart"
  13. "github.com/rcrowley/go-metrics"
  14. "github.com/sirupsen/logrus"
  15. "github.com/slackhq/nebula/config"
  16. "github.com/slackhq/nebula/firewall"
  17. "github.com/slackhq/nebula/header"
  18. "github.com/slackhq/nebula/overlay"
  19. "github.com/slackhq/nebula/packet"
  20. "github.com/slackhq/nebula/udp"
  21. )
  22. const mtu = 9001
  23. type InterfaceConfig struct {
  24. HostMap *HostMap
  25. Outside udp.Conn
  26. Inside overlay.Device
  27. pki *PKI
  28. Cipher string
  29. Firewall *Firewall
  30. ServeDns bool
  31. HandshakeManager *HandshakeManager
  32. lightHouse *LightHouse
  33. connectionManager *connectionManager
  34. DropLocalBroadcast bool
  35. DropMulticast bool
  36. routines int
  37. MessageMetrics *MessageMetrics
  38. version string
  39. relayManager *relayManager
  40. punchy *Punchy
  41. tryPromoteEvery uint32
  42. reQueryEvery uint32
  43. reQueryWait time.Duration
  44. ConntrackCacheTimeout time.Duration
  45. l *logrus.Logger
  46. }
  47. type Interface struct {
  48. hostMap *HostMap
  49. outside udp.Conn
  50. inside overlay.Device
  51. pki *PKI
  52. firewall *Firewall
  53. connectionManager *connectionManager
  54. handshakeManager *HandshakeManager
  55. serveDns bool
  56. createTime time.Time
  57. lightHouse *LightHouse
  58. myBroadcastAddrsTable *bart.Lite
  59. myVpnAddrs []netip.Addr // A list of addresses assigned to us via our certificate
  60. myVpnAddrsTable *bart.Lite
  61. myVpnNetworks []netip.Prefix // A list of networks assigned to us via our certificate
  62. myVpnNetworksTable *bart.Lite
  63. dropLocalBroadcast bool
  64. dropMulticast bool
  65. routines int
  66. disconnectInvalid atomic.Bool
  67. closed atomic.Bool
  68. relayManager *relayManager
  69. tryPromoteEvery atomic.Uint32
  70. reQueryEvery atomic.Uint32
  71. reQueryWait atomic.Int64
  72. sendRecvErrorConfig sendRecvErrorConfig
  73. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  74. rebindCount int8
  75. version string
  76. conntrackCacheTimeout time.Duration
  77. writers []udp.Conn
  78. readers []io.ReadWriteCloser
  79. wg sync.WaitGroup
  80. metricHandshakes metrics.Histogram
  81. messageMetrics *MessageMetrics
  82. cachedPacketMetrics *cachedPacketMetrics
  83. l *logrus.Logger
  84. inPool sync.Pool
  85. inbound chan *packet.Packet
  86. outPool sync.Pool
  87. outbound chan *[]byte
  88. }
  89. type EncWriter interface {
  90. SendVia(via *HostInfo,
  91. relay *Relay,
  92. ad,
  93. nb,
  94. out []byte,
  95. nocopy bool,
  96. )
  97. SendMessageToVpnAddr(t header.MessageType, st header.MessageSubType, vpnAddr netip.Addr, p, nb, out []byte)
  98. SendMessageToHostInfo(t header.MessageType, st header.MessageSubType, hostinfo *HostInfo, p, nb, out []byte)
  99. Handshake(vpnAddr netip.Addr)
  100. GetHostInfo(vpnAddr netip.Addr) *HostInfo
  101. GetCertState() *CertState
  102. }
  103. type sendRecvErrorConfig uint8
  104. const (
  105. sendRecvErrorAlways sendRecvErrorConfig = iota
  106. sendRecvErrorNever
  107. sendRecvErrorPrivate
  108. )
  109. func (s sendRecvErrorConfig) ShouldSendRecvError(endpoint netip.AddrPort) bool {
  110. switch s {
  111. case sendRecvErrorPrivate:
  112. return endpoint.Addr().IsPrivate()
  113. case sendRecvErrorAlways:
  114. return true
  115. case sendRecvErrorNever:
  116. return false
  117. default:
  118. panic(fmt.Errorf("invalid sendRecvErrorConfig value: %d", s))
  119. }
  120. }
  121. func (s sendRecvErrorConfig) String() string {
  122. switch s {
  123. case sendRecvErrorAlways:
  124. return "always"
  125. case sendRecvErrorNever:
  126. return "never"
  127. case sendRecvErrorPrivate:
  128. return "private"
  129. default:
  130. return fmt.Sprintf("invalid(%d)", s)
  131. }
  132. }
  133. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  134. if c.Outside == nil {
  135. return nil, errors.New("no outside connection")
  136. }
  137. if c.Inside == nil {
  138. return nil, errors.New("no inside interface (tun)")
  139. }
  140. if c.pki == nil {
  141. return nil, errors.New("no certificate state")
  142. }
  143. if c.Firewall == nil {
  144. return nil, errors.New("no firewall rules")
  145. }
  146. if c.connectionManager == nil {
  147. return nil, errors.New("no connection manager")
  148. }
  149. cs := c.pki.getCertState()
  150. ifce := &Interface{
  151. pki: c.pki,
  152. hostMap: c.HostMap,
  153. outside: c.Outside,
  154. inside: c.Inside,
  155. firewall: c.Firewall,
  156. serveDns: c.ServeDns,
  157. handshakeManager: c.HandshakeManager,
  158. createTime: time.Now(),
  159. lightHouse: c.lightHouse,
  160. dropLocalBroadcast: c.DropLocalBroadcast,
  161. dropMulticast: c.DropMulticast,
  162. routines: c.routines,
  163. version: c.version,
  164. writers: make([]udp.Conn, c.routines),
  165. readers: make([]io.ReadWriteCloser, c.routines),
  166. myVpnNetworks: cs.myVpnNetworks,
  167. myVpnNetworksTable: cs.myVpnNetworksTable,
  168. myVpnAddrs: cs.myVpnAddrs,
  169. myVpnAddrsTable: cs.myVpnAddrsTable,
  170. myBroadcastAddrsTable: cs.myVpnBroadcastAddrsTable,
  171. relayManager: c.relayManager,
  172. connectionManager: c.connectionManager,
  173. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  174. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  175. messageMetrics: c.MessageMetrics,
  176. cachedPacketMetrics: &cachedPacketMetrics{
  177. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  178. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  179. },
  180. //TODO: configurable size
  181. inbound: make(chan *packet.Packet, 1028),
  182. outbound: make(chan *[]byte, 1028),
  183. l: c.l,
  184. }
  185. ifce.inPool = sync.Pool{New: func() any {
  186. return packet.New()
  187. }}
  188. ifce.outPool = sync.Pool{New: func() any {
  189. t := make([]byte, mtu)
  190. return &t
  191. }}
  192. ifce.tryPromoteEvery.Store(c.tryPromoteEvery)
  193. ifce.reQueryEvery.Store(c.reQueryEvery)
  194. ifce.reQueryWait.Store(int64(c.reQueryWait))
  195. ifce.connectionManager.intf = ifce
  196. return ifce, nil
  197. }
  198. // activate creates the interface on the host. After the interface is created, any
  199. // other services that want to bind listeners to its IP may do so successfully. However,
  200. // the interface isn't going to process anything until run() is called.
  201. func (f *Interface) activate() error {
  202. // actually turn on tun dev
  203. addr, err := f.outside.LocalAddr()
  204. if err != nil {
  205. f.l.WithError(err).Error("Failed to get udp listen address")
  206. }
  207. f.l.WithField("interface", f.inside.Name()).WithField("networks", f.myVpnNetworks).
  208. WithField("build", f.version).WithField("udpAddr", addr).
  209. WithField("boringcrypto", boringEnabled()).
  210. Info("Nebula interface is active")
  211. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  212. // Prepare n tun queues
  213. var reader io.ReadWriteCloser = f.inside
  214. for i := 0; i < f.routines; i++ {
  215. if i > 0 {
  216. reader, err = f.inside.NewMultiQueueReader()
  217. if err != nil {
  218. return err
  219. }
  220. }
  221. f.readers[i] = reader
  222. }
  223. if err = f.inside.Activate(); err != nil {
  224. f.inside.Close()
  225. return err
  226. }
  227. return nil
  228. }
  229. func (f *Interface) run(c context.Context) (func(), error) {
  230. for i := 0; i < f.routines; i++ {
  231. // Launch n queues to read packets from udp
  232. f.wg.Add(1)
  233. go f.listenOut(i)
  234. // Launch n queues to read packets from tun dev
  235. f.wg.Add(1)
  236. go f.listenIn(f.readers[i], i)
  237. // Launch n queues to read packets from tun dev
  238. f.wg.Add(1)
  239. go f.workerIn(i, c)
  240. // Launch n queues to read packets from tun dev
  241. f.wg.Add(1)
  242. go f.workerOut(i, c)
  243. }
  244. return f.wg.Wait, nil
  245. }
  246. func (f *Interface) listenOut(i int) {
  247. runtime.LockOSThread()
  248. var li udp.Conn
  249. if i > 0 {
  250. li = f.writers[i]
  251. } else {
  252. li = f.outside
  253. }
  254. err := li.ListenOut(func(fromUdpAddr netip.AddrPort, payload []byte) {
  255. p := f.inPool.Get().(*packet.Packet)
  256. //TODO: have the listener store this in the msgs array after a read instead of doing a copy
  257. p.Payload = p.Payload[:mtu]
  258. copy(p.Payload, payload)
  259. p.Payload = p.Payload[:len(payload)]
  260. p.Addr = fromUdpAddr
  261. f.inbound <- p
  262. //select {
  263. //case f.inbound <- p:
  264. //default:
  265. // f.l.Error("Dropped packet from inbound channel")
  266. //}
  267. })
  268. if err != nil && !f.closed.Load() {
  269. f.l.WithError(err).Error("Error while reading packet inbound packet, closing")
  270. //TODO: Trigger Control to close
  271. }
  272. f.l.Debugf("underlay reader %v is done", i)
  273. f.wg.Done()
  274. }
  275. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  276. runtime.LockOSThread()
  277. for {
  278. p := f.outPool.Get().(*[]byte)
  279. *p = (*p)[:mtu]
  280. n, err := reader.Read(*p)
  281. if err != nil {
  282. if !f.closed.Load() {
  283. f.l.WithError(err).Error("Error while reading outbound packet, closing")
  284. //TODO: Trigger Control to close
  285. }
  286. break
  287. }
  288. *p = (*p)[:n]
  289. //TODO: nonblocking channel write
  290. f.outbound <- p
  291. //select {
  292. //case f.outbound <- p:
  293. //default:
  294. // f.l.Error("Dropped packet from outbound channel")
  295. //}
  296. }
  297. f.l.Debugf("overlay reader %v is done", i)
  298. f.wg.Done()
  299. }
  300. func (f *Interface) workerIn(i int, ctx context.Context) {
  301. lhh := f.lightHouse.NewRequestHandler()
  302. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  303. fwPacket2 := &firewall.Packet{}
  304. nb2 := make([]byte, 12, 12)
  305. result2 := make([]byte, mtu)
  306. h := &header.H{}
  307. for {
  308. select {
  309. case p := <-f.inbound:
  310. f.readOutsidePackets(p.Addr, nil, result2[:0], p.Payload, h, fwPacket2, lhh, nb2, i, conntrackCache.Get(f.l))
  311. p.Payload = p.Payload[:mtu]
  312. f.inPool.Put(p)
  313. case <-ctx.Done():
  314. f.wg.Done()
  315. return
  316. }
  317. }
  318. }
  319. func (f *Interface) workerOut(i int, ctx context.Context) {
  320. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  321. fwPacket1 := &firewall.Packet{}
  322. nb1 := make([]byte, 12, 12)
  323. result1 := make([]byte, mtu)
  324. for {
  325. select {
  326. case data := <-f.outbound:
  327. f.consumeInsidePacket(*data, fwPacket1, nb1, result1, i, conntrackCache.Get(f.l))
  328. *data = (*data)[:mtu]
  329. f.outPool.Put(data)
  330. case <-ctx.Done():
  331. f.wg.Done()
  332. return
  333. }
  334. }
  335. }
  336. func (f *Interface) RegisterConfigChangeCallbacks(c *config.C) {
  337. c.RegisterReloadCallback(f.reloadFirewall)
  338. c.RegisterReloadCallback(f.reloadSendRecvError)
  339. c.RegisterReloadCallback(f.reloadDisconnectInvalid)
  340. c.RegisterReloadCallback(f.reloadMisc)
  341. for _, udpConn := range f.writers {
  342. c.RegisterReloadCallback(udpConn.ReloadConfig)
  343. }
  344. }
  345. func (f *Interface) reloadDisconnectInvalid(c *config.C) {
  346. initial := c.InitialLoad()
  347. if initial || c.HasChanged("pki.disconnect_invalid") {
  348. f.disconnectInvalid.Store(c.GetBool("pki.disconnect_invalid", true))
  349. if !initial {
  350. f.l.Infof("pki.disconnect_invalid changed to %v", f.disconnectInvalid.Load())
  351. }
  352. }
  353. }
  354. func (f *Interface) reloadFirewall(c *config.C) {
  355. //TODO: need to trigger/detect if the certificate changed too
  356. if c.HasChanged("firewall") == false {
  357. f.l.Debug("No firewall config change detected")
  358. return
  359. }
  360. fw, err := NewFirewallFromConfig(f.l, f.pki.getCertState(), c)
  361. if err != nil {
  362. f.l.WithError(err).Error("Error while creating firewall during reload")
  363. return
  364. }
  365. oldFw := f.firewall
  366. conntrack := oldFw.Conntrack
  367. conntrack.Lock()
  368. defer conntrack.Unlock()
  369. fw.rulesVersion = oldFw.rulesVersion + 1
  370. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  371. // safe and just reset conntrack in this case.
  372. if fw.rulesVersion == 0 {
  373. f.l.WithField("firewallHashes", fw.GetRuleHashes()).
  374. WithField("oldFirewallHashes", oldFw.GetRuleHashes()).
  375. WithField("rulesVersion", fw.rulesVersion).
  376. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  377. } else {
  378. fw.Conntrack = conntrack
  379. }
  380. f.firewall = fw
  381. oldFw.Destroy()
  382. f.l.WithField("firewallHashes", fw.GetRuleHashes()).
  383. WithField("oldFirewallHashes", oldFw.GetRuleHashes()).
  384. WithField("rulesVersion", fw.rulesVersion).
  385. Info("New firewall has been installed")
  386. }
  387. func (f *Interface) reloadSendRecvError(c *config.C) {
  388. if c.InitialLoad() || c.HasChanged("listen.send_recv_error") {
  389. stringValue := c.GetString("listen.send_recv_error", "always")
  390. switch stringValue {
  391. case "always":
  392. f.sendRecvErrorConfig = sendRecvErrorAlways
  393. case "never":
  394. f.sendRecvErrorConfig = sendRecvErrorNever
  395. case "private":
  396. f.sendRecvErrorConfig = sendRecvErrorPrivate
  397. default:
  398. if c.GetBool("listen.send_recv_error", true) {
  399. f.sendRecvErrorConfig = sendRecvErrorAlways
  400. } else {
  401. f.sendRecvErrorConfig = sendRecvErrorNever
  402. }
  403. }
  404. f.l.WithField("sendRecvError", f.sendRecvErrorConfig.String()).
  405. Info("Loaded send_recv_error config")
  406. }
  407. }
  408. func (f *Interface) reloadMisc(c *config.C) {
  409. if c.HasChanged("counters.try_promote") {
  410. n := c.GetUint32("counters.try_promote", defaultPromoteEvery)
  411. f.tryPromoteEvery.Store(n)
  412. f.l.Info("counters.try_promote has changed")
  413. }
  414. if c.HasChanged("counters.requery_every_packets") {
  415. n := c.GetUint32("counters.requery_every_packets", defaultReQueryEvery)
  416. f.reQueryEvery.Store(n)
  417. f.l.Info("counters.requery_every_packets has changed")
  418. }
  419. if c.HasChanged("timers.requery_wait_duration") {
  420. n := c.GetDuration("timers.requery_wait_duration", defaultReQueryWait)
  421. f.reQueryWait.Store(int64(n))
  422. f.l.Info("timers.requery_wait_duration has changed")
  423. }
  424. }
  425. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  426. ticker := time.NewTicker(i)
  427. defer ticker.Stop()
  428. udpStats := udp.NewUDPStatsEmitter(f.writers)
  429. certExpirationGauge := metrics.GetOrRegisterGauge("certificate.ttl_seconds", nil)
  430. certInitiatingVersion := metrics.GetOrRegisterGauge("certificate.initiating_version", nil)
  431. certMaxVersion := metrics.GetOrRegisterGauge("certificate.max_version", nil)
  432. for {
  433. select {
  434. case <-ctx.Done():
  435. return
  436. case <-ticker.C:
  437. f.firewall.EmitStats()
  438. f.handshakeManager.EmitStats()
  439. udpStats()
  440. certState := f.pki.getCertState()
  441. defaultCrt := certState.GetDefaultCertificate()
  442. certExpirationGauge.Update(int64(defaultCrt.NotAfter().Sub(time.Now()) / time.Second))
  443. certInitiatingVersion.Update(int64(defaultCrt.Version()))
  444. // Report the max certificate version we are capable of using
  445. if certState.v2Cert != nil {
  446. certMaxVersion.Update(int64(certState.v2Cert.Version()))
  447. } else {
  448. certMaxVersion.Update(int64(certState.v1Cert.Version()))
  449. }
  450. }
  451. }
  452. }
  453. func (f *Interface) GetHostInfo(vpnIp netip.Addr) *HostInfo {
  454. return f.hostMap.QueryVpnAddr(vpnIp)
  455. }
  456. func (f *Interface) GetCertState() *CertState {
  457. return f.pki.getCertState()
  458. }
  459. func (f *Interface) Close() error {
  460. f.closed.Store(true)
  461. // Release the udp readers
  462. for _, u := range f.writers {
  463. err := u.Close()
  464. if err != nil {
  465. f.l.WithError(err).Error("Error while closing udp socket")
  466. }
  467. }
  468. // Release the tun readers
  469. for _, u := range f.readers {
  470. err := u.Close()
  471. if err != nil {
  472. f.l.WithError(err).Error("Error while closing tun device")
  473. }
  474. }
  475. return nil
  476. }