interface.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "fmt"
  6. "net/netip"
  7. "os"
  8. "runtime"
  9. "sync/atomic"
  10. "time"
  11. "github.com/gaissmai/bart"
  12. "github.com/rcrowley/go-metrics"
  13. "github.com/sirupsen/logrus"
  14. "github.com/slackhq/nebula/config"
  15. "github.com/slackhq/nebula/firewall"
  16. "github.com/slackhq/nebula/header"
  17. "github.com/slackhq/nebula/overlay"
  18. "github.com/slackhq/nebula/packet"
  19. "github.com/slackhq/nebula/udp"
  20. )
  // Package-level sizing constants.
  const (
  	// mtu is not referenced in the visible part of this file; presumably the
  	// default MTU in bytes — confirm against its users elsewhere in the package.
  	mtu = 9001

  	// batch is the number of packet buffers listenIn and listenOut preallocate
  	// per queue.
  	batch = 1024 //todo config!
  )
  23. type InterfaceConfig struct {
  24. HostMap *HostMap
  25. Outside udp.Conn
  26. Inside overlay.Device
  27. pki *PKI
  28. Cipher string
  29. Firewall *Firewall
  30. ServeDns bool
  31. HandshakeManager *HandshakeManager
  32. lightHouse *LightHouse
  33. connectionManager *connectionManager
  34. DropLocalBroadcast bool
  35. DropMulticast bool
  36. routines int
  37. MessageMetrics *MessageMetrics
  38. version string
  39. relayManager *relayManager
  40. punchy *Punchy
  41. tryPromoteEvery uint32
  42. reQueryEvery uint32
  43. reQueryWait time.Duration
  44. ConntrackCacheTimeout time.Duration
  45. l *logrus.Logger
  46. }
  47. type Interface struct {
  48. hostMap *HostMap
  49. outside udp.Conn
  50. inside overlay.Device
  51. pki *PKI
  52. firewall *Firewall
  53. connectionManager *connectionManager
  54. handshakeManager *HandshakeManager
  55. serveDns bool
  56. createTime time.Time
  57. lightHouse *LightHouse
  58. myBroadcastAddrsTable *bart.Lite
  59. myVpnAddrs []netip.Addr // A list of addresses assigned to us via our certificate
  60. myVpnAddrsTable *bart.Lite
  61. myVpnNetworks []netip.Prefix // A list of networks assigned to us via our certificate
  62. myVpnNetworksTable *bart.Lite
  63. dropLocalBroadcast bool
  64. dropMulticast bool
  65. routines int
  66. disconnectInvalid atomic.Bool
  67. closed atomic.Bool
  68. relayManager *relayManager
  69. tryPromoteEvery atomic.Uint32
  70. reQueryEvery atomic.Uint32
  71. reQueryWait atomic.Int64
  72. sendRecvErrorConfig sendRecvErrorConfig
  73. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  74. rebindCount int8
  75. version string
  76. conntrackCacheTimeout time.Duration
  77. writers []udp.Conn
  78. readers []overlay.TunDev
  79. metricHandshakes metrics.Histogram
  80. messageMetrics *MessageMetrics
  81. cachedPacketMetrics *cachedPacketMetrics
  82. listenInN int
  83. listenOutN int
  84. listenInMetric metrics.Histogram
  85. listenOutMetric metrics.Histogram
  86. l *logrus.Logger
  87. }
  88. type EncWriter interface {
  89. SendVia(via *HostInfo,
  90. relay *Relay,
  91. ad,
  92. nb,
  93. out []byte,
  94. nocopy bool,
  95. )
  96. SendMessageToVpnAddr(t header.MessageType, st header.MessageSubType, vpnAddr netip.Addr, p, nb, out []byte)
  97. SendMessageToHostInfo(t header.MessageType, st header.MessageSubType, hostinfo *HostInfo, p, nb, out []byte)
  98. Handshake(vpnAddr netip.Addr)
  99. GetHostInfo(vpnAddr netip.Addr) *HostInfo
  100. GetCertState() *CertState
  101. }
  // sendRecvErrorConfig selects the policy ShouldSendRecvError applies to a
  // remote endpoint. The zero value is sendRecvErrorAlways.
  type sendRecvErrorConfig uint8

  const (
  	// sendRecvErrorAlways answers true for every endpoint.
  	sendRecvErrorAlways sendRecvErrorConfig = iota
  	// sendRecvErrorNever answers false for every endpoint.
  	sendRecvErrorNever
  	// sendRecvErrorPrivate answers true only for private addresses.
  	sendRecvErrorPrivate
  )

  // ShouldSendRecvError reports whether the policy s allows a recv_error for
  // endpoint. It panics when s is not one of the declared constants.
  func (s sendRecvErrorConfig) ShouldSendRecvError(endpoint netip.AddrPort) bool {
  	switch s {
  	case sendRecvErrorAlways:
  		return true
  	case sendRecvErrorNever:
  		return false
  	case sendRecvErrorPrivate:
  		return endpoint.Addr().IsPrivate()
  	}
  	panic(fmt.Errorf("invalid sendRecvErrorConfig value: %d", s))
  }

  // String returns the configuration spelling of s ("always", "never",
  // "private"), or "invalid(N)" for any other value.
  func (s sendRecvErrorConfig) String() string {
  	names := [...]string{
  		sendRecvErrorAlways:  "always",
  		sendRecvErrorNever:   "never",
  		sendRecvErrorPrivate: "private",
  	}
  	if int(s) < len(names) {
  		return names[s]
  	}
  	return fmt.Sprintf("invalid(%d)", s)
  }
  132. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  133. if c.Outside == nil {
  134. return nil, errors.New("no outside connection")
  135. }
  136. if c.Inside == nil {
  137. return nil, errors.New("no inside interface (tun)")
  138. }
  139. if c.pki == nil {
  140. return nil, errors.New("no certificate state")
  141. }
  142. if c.Firewall == nil {
  143. return nil, errors.New("no firewall rules")
  144. }
  145. if c.connectionManager == nil {
  146. return nil, errors.New("no connection manager")
  147. }
  148. cs := c.pki.getCertState()
  149. ifce := &Interface{
  150. pki: c.pki,
  151. hostMap: c.HostMap,
  152. outside: c.Outside,
  153. inside: c.Inside,
  154. firewall: c.Firewall,
  155. serveDns: c.ServeDns,
  156. handshakeManager: c.HandshakeManager,
  157. createTime: time.Now(),
  158. lightHouse: c.lightHouse,
  159. dropLocalBroadcast: c.DropLocalBroadcast,
  160. dropMulticast: c.DropMulticast,
  161. routines: c.routines,
  162. version: c.version,
  163. writers: make([]udp.Conn, c.routines),
  164. readers: make([]overlay.TunDev, c.routines),
  165. myVpnNetworks: cs.myVpnNetworks,
  166. myVpnNetworksTable: cs.myVpnNetworksTable,
  167. myVpnAddrs: cs.myVpnAddrs,
  168. myVpnAddrsTable: cs.myVpnAddrsTable,
  169. myBroadcastAddrsTable: cs.myVpnBroadcastAddrsTable,
  170. relayManager: c.relayManager,
  171. connectionManager: c.connectionManager,
  172. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  173. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  174. messageMetrics: c.MessageMetrics,
  175. cachedPacketMetrics: &cachedPacketMetrics{
  176. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  177. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  178. },
  179. l: c.l,
  180. }
  181. ifce.listenInMetric = metrics.GetOrRegisterHistogram("vhost.listenIn.n", nil, metrics.NewExpDecaySample(1028, 0.015))
  182. ifce.listenOutMetric = metrics.GetOrRegisterHistogram("vhost.listenOut.n", nil, metrics.NewExpDecaySample(1028, 0.015))
  183. ifce.tryPromoteEvery.Store(c.tryPromoteEvery)
  184. ifce.reQueryEvery.Store(c.reQueryEvery)
  185. ifce.reQueryWait.Store(int64(c.reQueryWait))
  186. ifce.connectionManager.intf = ifce
  187. return ifce, nil
  188. }
  189. // activate creates the interface on the host. After the interface is created, any
  190. // other services that want to bind listeners to its IP may do so successfully. However,
  191. // the interface isn't going to process anything until run() is called.
  192. func (f *Interface) activate() {
  193. // actually turn on tun dev
  194. addr, err := f.outside.LocalAddr()
  195. if err != nil {
  196. f.l.WithError(err).Error("Failed to get udp listen address")
  197. }
  198. f.l.WithField("interface", f.inside.Name()).WithField("networks", f.myVpnNetworks).
  199. WithField("build", f.version).WithField("udpAddr", addr).
  200. WithField("boringcrypto", boringEnabled()).
  201. Info("Nebula interface is active")
  202. if f.routines > 1 {
  203. if !f.inside.SupportsMultiqueue() || !f.outside.SupportsMultipleReaders() {
  204. f.routines = 1
  205. f.l.Warn("routines is not supported on this platform, falling back to a single routine")
  206. }
  207. }
  208. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  209. // Prepare n tun queues
  210. var reader overlay.TunDev = f.inside
  211. for i := 0; i < f.routines; i++ {
  212. if i > 0 {
  213. reader, err = f.inside.NewMultiQueueReader()
  214. if err != nil {
  215. f.l.Fatal(err)
  216. }
  217. }
  218. f.readers[i] = reader
  219. }
  220. if err := f.inside.Activate(); err != nil {
  221. f.inside.Close()
  222. f.l.Fatal(err)
  223. }
  224. }
  225. func (f *Interface) run() {
  226. // Launch n queues to read packets from udp
  227. for i := 0; i < f.routines; i++ {
  228. go f.listenOut(i)
  229. }
  230. // Launch n queues to read packets from tun dev
  231. for i := 0; i < f.routines; i++ {
  232. go f.listenIn(f.readers[i], i)
  233. }
  234. }
  235. func (f *Interface) listenOut(q int) {
  236. runtime.LockOSThread()
  237. var li udp.Conn
  238. if q > 0 {
  239. li = f.writers[q]
  240. } else {
  241. li = f.outside
  242. }
  243. ctCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  244. lhh := f.lightHouse.NewRequestHandler()
  245. outPackets := make([]*packet.OutPacket, batch)
  246. for i := 0; i < batch; i++ {
  247. outPackets[i] = packet.NewOut()
  248. }
  249. h := &header.H{}
  250. fwPacket := &firewall.Packet{}
  251. nb := make([]byte, 12, 12)
  252. toSend := make([][]byte, batch)
  253. li.ListenOut(func(pkts []*packet.Packet) {
  254. toSend = toSend[:0]
  255. for i := range outPackets {
  256. outPackets[i].Valid = false
  257. outPackets[i].SegCounter = 0
  258. }
  259. //todo f.readOutsidePackets(ViaSender{UdpAddr: fromUdpAddr}, plaintext[:0], payload, h, fwPacket, lhh, nb, i, ctCache.Get(f.l))
  260. f.readOutsidePacketsMany(pkts, outPackets, h, fwPacket, lhh, nb, q, ctCache.Get(f.l), time.Now())
  261. //we opportunistically tx, but try to also send stragglers
  262. if _, err := f.readers[q].WriteMany(outPackets, q); err != nil {
  263. f.l.WithError(err).Error("Failed to send packets")
  264. }
  265. //todo I broke this
  266. //n := len(toSend)
  267. //if f.l.Level == logrus.DebugLevel {
  268. // f.listenOutMetric.Update(int64(n))
  269. //}
  270. //f.listenOutN = n
  271. })
  272. }
  273. func (f *Interface) listenIn(reader overlay.TunDev, queueNum int) {
  274. runtime.LockOSThread()
  275. fwPacket := &firewall.Packet{}
  276. nb := make([]byte, 12, 12)
  277. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  278. packets := make([]*packet.VirtIOPacket, batch)
  279. outPackets := make([]*packet.Packet, batch)
  280. for i := 0; i < batch; i++ {
  281. packets[i] = packet.NewVIO()
  282. outPackets[i] = packet.New(false) //todo?
  283. }
  284. for {
  285. n, err := reader.ReadMany(packets, queueNum)
  286. //todo!!
  287. if err != nil {
  288. if errors.Is(err, os.ErrClosed) && f.closed.Load() {
  289. return
  290. }
  291. f.l.WithError(err).Error("Error while reading outbound packet")
  292. // This only seems to happen when something fatal happens to the fd, so exit.
  293. os.Exit(2)
  294. }
  295. if f.l.Level == logrus.DebugLevel {
  296. f.listenInMetric.Update(int64(n))
  297. }
  298. f.listenInN = n
  299. now := time.Now()
  300. for i, pkt := range packets[:n] {
  301. outPackets[i].OutLen = -1
  302. f.consumeInsidePacket(pkt.Payload, fwPacket, nb, outPackets[i], queueNum, conntrackCache.Get(f.l), now)
  303. reader.RecycleRxSeg(pkt, i == (n-1), queueNum) //todo handle err?
  304. pkt.Reset()
  305. }
  306. _, err = f.writers[queueNum].WriteBatch(outPackets[:n])
  307. if err != nil {
  308. f.l.WithError(err).Error("Error while writing outbound packets")
  309. }
  310. }
  311. }
  312. func (f *Interface) RegisterConfigChangeCallbacks(c *config.C) {
  313. c.RegisterReloadCallback(f.reloadFirewall)
  314. c.RegisterReloadCallback(f.reloadSendRecvError)
  315. c.RegisterReloadCallback(f.reloadDisconnectInvalid)
  316. c.RegisterReloadCallback(f.reloadMisc)
  317. for _, udpConn := range f.writers {
  318. c.RegisterReloadCallback(udpConn.ReloadConfig)
  319. }
  320. }
  321. func (f *Interface) reloadDisconnectInvalid(c *config.C) {
  322. initial := c.InitialLoad()
  323. if initial || c.HasChanged("pki.disconnect_invalid") {
  324. f.disconnectInvalid.Store(c.GetBool("pki.disconnect_invalid", true))
  325. if !initial {
  326. f.l.Infof("pki.disconnect_invalid changed to %v", f.disconnectInvalid.Load())
  327. }
  328. }
  329. }
  330. func (f *Interface) reloadFirewall(c *config.C) {
  331. //TODO: need to trigger/detect if the certificate changed too
  332. if c.HasChanged("firewall") == false {
  333. f.l.Debug("No firewall config change detected")
  334. return
  335. }
  336. fw, err := NewFirewallFromConfig(f.l, f.pki.getCertState(), c)
  337. if err != nil {
  338. f.l.WithError(err).Error("Error while creating firewall during reload")
  339. return
  340. }
  341. oldFw := f.firewall
  342. conntrack := oldFw.Conntrack
  343. conntrack.Lock()
  344. defer conntrack.Unlock()
  345. fw.rulesVersion = oldFw.rulesVersion + 1
  346. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  347. // safe and just reset conntrack in this case.
  348. if fw.rulesVersion == 0 {
  349. f.l.WithField("firewallHashes", fw.GetRuleHashes()).
  350. WithField("oldFirewallHashes", oldFw.GetRuleHashes()).
  351. WithField("rulesVersion", fw.rulesVersion).
  352. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  353. } else {
  354. fw.Conntrack = conntrack
  355. }
  356. f.firewall = fw
  357. oldFw.Destroy()
  358. f.l.WithField("firewallHashes", fw.GetRuleHashes()).
  359. WithField("oldFirewallHashes", oldFw.GetRuleHashes()).
  360. WithField("rulesVersion", fw.rulesVersion).
  361. Info("New firewall has been installed")
  362. }
  363. func (f *Interface) reloadSendRecvError(c *config.C) {
  364. if c.InitialLoad() || c.HasChanged("listen.send_recv_error") {
  365. stringValue := c.GetString("listen.send_recv_error", "always")
  366. switch stringValue {
  367. case "always":
  368. f.sendRecvErrorConfig = sendRecvErrorAlways
  369. case "never":
  370. f.sendRecvErrorConfig = sendRecvErrorNever
  371. case "private":
  372. f.sendRecvErrorConfig = sendRecvErrorPrivate
  373. default:
  374. if c.GetBool("listen.send_recv_error", true) {
  375. f.sendRecvErrorConfig = sendRecvErrorAlways
  376. } else {
  377. f.sendRecvErrorConfig = sendRecvErrorNever
  378. }
  379. }
  380. f.l.WithField("sendRecvError", f.sendRecvErrorConfig.String()).
  381. Info("Loaded send_recv_error config")
  382. }
  383. }
  384. func (f *Interface) reloadMisc(c *config.C) {
  385. if c.HasChanged("counters.try_promote") {
  386. n := c.GetUint32("counters.try_promote", defaultPromoteEvery)
  387. f.tryPromoteEvery.Store(n)
  388. f.l.Info("counters.try_promote has changed")
  389. }
  390. if c.HasChanged("counters.requery_every_packets") {
  391. n := c.GetUint32("counters.requery_every_packets", defaultReQueryEvery)
  392. f.reQueryEvery.Store(n)
  393. f.l.Info("counters.requery_every_packets has changed")
  394. }
  395. if c.HasChanged("timers.requery_wait_duration") {
  396. n := c.GetDuration("timers.requery_wait_duration", defaultReQueryWait)
  397. f.reQueryWait.Store(int64(n))
  398. f.l.Info("timers.requery_wait_duration has changed")
  399. }
  400. }
  401. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  402. ticker := time.NewTicker(i)
  403. defer ticker.Stop()
  404. udpStats := udp.NewUDPStatsEmitter(f.writers)
  405. certExpirationGauge := metrics.GetOrRegisterGauge("certificate.ttl_seconds", nil)
  406. certInitiatingVersion := metrics.GetOrRegisterGauge("certificate.initiating_version", nil)
  407. certMaxVersion := metrics.GetOrRegisterGauge("certificate.max_version", nil)
  408. for {
  409. select {
  410. case <-ctx.Done():
  411. return
  412. case <-ticker.C:
  413. f.firewall.EmitStats()
  414. f.handshakeManager.EmitStats()
  415. udpStats()
  416. certState := f.pki.getCertState()
  417. defaultCrt := certState.GetDefaultCertificate()
  418. certExpirationGauge.Update(int64(defaultCrt.NotAfter().Sub(time.Now()) / time.Second))
  419. certInitiatingVersion.Update(int64(defaultCrt.Version()))
  420. // Report the max certificate version we are capable of using
  421. if certState.v2Cert != nil {
  422. certMaxVersion.Update(int64(certState.v2Cert.Version()))
  423. } else {
  424. certMaxVersion.Update(int64(certState.v1Cert.Version()))
  425. }
  426. if f.l.Level != logrus.DebugLevel {
  427. f.listenInMetric.Update(int64(f.listenInN))
  428. f.listenOutMetric.Update(int64(f.listenOutN))
  429. }
  430. }
  431. }
  432. }
  433. func (f *Interface) GetHostInfo(vpnIp netip.Addr) *HostInfo {
  434. return f.hostMap.QueryVpnAddr(vpnIp)
  435. }
  436. func (f *Interface) GetCertState() *CertState {
  437. return f.pki.getCertState()
  438. }
  439. func (f *Interface) Close() error {
  440. f.closed.Store(true)
  441. for _, u := range f.writers {
  442. err := u.Close()
  443. if err != nil {
  444. f.l.WithError(err).Error("Error while closing udp socket")
  445. }
  446. }
  447. // Release the tun device
  448. return f.inside.Close()
  449. }