interface.go 9.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "io"
  6. "net"
  7. "os"
  8. "runtime"
  9. "sync/atomic"
  10. "time"
  11. "unsafe"
  12. "github.com/rcrowley/go-metrics"
  13. "github.com/sirupsen/logrus"
  14. "github.com/slackhq/nebula/cert"
  15. "github.com/slackhq/nebula/config"
  16. "github.com/slackhq/nebula/firewall"
  17. "github.com/slackhq/nebula/iputil"
  18. "github.com/slackhq/nebula/udp"
  19. )
// mtu is the size, in bytes, of the packet and output buffers that listenIn
// allocates for each tun reader.
const mtu = 9001
  21. type Inside interface {
  22. io.ReadWriteCloser
  23. Activate() error
  24. CidrNet() *net.IPNet
  25. DeviceName() string
  26. WriteRaw([]byte) error
  27. NewMultiQueueReader() (io.ReadWriteCloser, error)
  28. }
  29. type InterfaceConfig struct {
  30. HostMap *HostMap
  31. Outside *udp.Conn
  32. Inside Inside
  33. certState *CertState
  34. Cipher string
  35. Firewall *Firewall
  36. ServeDns bool
  37. HandshakeManager *HandshakeManager
  38. lightHouse *LightHouse
  39. checkInterval int
  40. pendingDeletionInterval int
  41. DropLocalBroadcast bool
  42. DropMulticast bool
  43. routines int
  44. MessageMetrics *MessageMetrics
  45. version string
  46. caPool *cert.NebulaCAPool
  47. disconnectInvalid bool
  48. psk *Psk
  49. ConntrackCacheTimeout time.Duration
  50. l *logrus.Logger
  51. }
  52. type Interface struct {
  53. hostMap *HostMap
  54. outside *udp.Conn
  55. inside Inside
  56. certState *CertState
  57. cipher string
  58. firewall *Firewall
  59. connectionManager *connectionManager
  60. handshakeManager *HandshakeManager
  61. serveDns bool
  62. createTime time.Time
  63. lightHouse *LightHouse
  64. localBroadcast iputil.VpnIp
  65. myVpnIp iputil.VpnIp
  66. dropLocalBroadcast bool
  67. dropMulticast bool
  68. routines int
  69. caPool *cert.NebulaCAPool
  70. disconnectInvalid bool
  71. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  72. rebindCount int8
  73. version string
  74. conntrackCacheTimeout time.Duration
  75. psk *Psk
  76. writers []*udp.Conn
  77. readers []io.ReadWriteCloser
  78. metricHandshakes metrics.Histogram
  79. messageMetrics *MessageMetrics
  80. cachedPacketMetrics *cachedPacketMetrics
  81. l *logrus.Logger
  82. }
  83. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  84. if c.Outside == nil {
  85. return nil, errors.New("no outside connection")
  86. }
  87. if c.Inside == nil {
  88. return nil, errors.New("no inside interface (tun)")
  89. }
  90. if c.certState == nil {
  91. return nil, errors.New("no certificate state")
  92. }
  93. if c.Firewall == nil {
  94. return nil, errors.New("no firewall rules")
  95. }
  96. myVpnIp := iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].IP)
  97. ifce := &Interface{
  98. hostMap: c.HostMap,
  99. outside: c.Outside,
  100. inside: c.Inside,
  101. certState: c.certState,
  102. cipher: c.Cipher,
  103. firewall: c.Firewall,
  104. serveDns: c.ServeDns,
  105. handshakeManager: c.HandshakeManager,
  106. createTime: time.Now(),
  107. lightHouse: c.lightHouse,
  108. localBroadcast: myVpnIp | ^iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].Mask),
  109. dropLocalBroadcast: c.DropLocalBroadcast,
  110. dropMulticast: c.DropMulticast,
  111. routines: c.routines,
  112. version: c.version,
  113. writers: make([]*udp.Conn, c.routines),
  114. readers: make([]io.ReadWriteCloser, c.routines),
  115. caPool: c.caPool,
  116. disconnectInvalid: c.disconnectInvalid,
  117. psk: c.psk,
  118. myVpnIp: myVpnIp,
  119. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  120. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  121. messageMetrics: c.MessageMetrics,
  122. cachedPacketMetrics: &cachedPacketMetrics{
  123. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  124. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  125. },
  126. l: c.l,
  127. }
  128. ifce.connectionManager = newConnectionManager(ctx, c.l, ifce, c.checkInterval, c.pendingDeletionInterval)
  129. return ifce, nil
  130. }
  131. // activate creates the interface on the host. After the interface is created, any
  132. // other services that want to bind listeners to its IP may do so successfully. However,
  133. // the interface isn't going to process anything until run() is called.
  134. func (f *Interface) activate() {
  135. // actually turn on tun dev
  136. addr, err := f.outside.LocalAddr()
  137. if err != nil {
  138. f.l.WithError(err).Error("Failed to get udp listen address")
  139. }
  140. f.l.WithField("interface", f.inside.DeviceName()).WithField("network", f.inside.CidrNet().String()).
  141. WithField("build", f.version).WithField("udpAddr", addr).
  142. Info("Nebula interface is active")
  143. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  144. // Prepare n tun queues
  145. var reader io.ReadWriteCloser = f.inside
  146. for i := 0; i < f.routines; i++ {
  147. if i > 0 {
  148. reader, err = f.inside.NewMultiQueueReader()
  149. if err != nil {
  150. f.l.Fatal(err)
  151. }
  152. }
  153. f.readers[i] = reader
  154. }
  155. if err := f.inside.Activate(); err != nil {
  156. f.l.Fatal(err)
  157. }
  158. }
  159. func (f *Interface) run() {
  160. // Launch n queues to read packets from udp
  161. for i := 0; i < f.routines; i++ {
  162. go f.listenOut(i)
  163. }
  164. // Launch n queues to read packets from tun dev
  165. for i := 0; i < f.routines; i++ {
  166. go f.listenIn(f.readers[i], i)
  167. }
  168. }
  169. func (f *Interface) listenOut(i int) {
  170. runtime.LockOSThread()
  171. var li *udp.Conn
  172. // TODO clean this up with a coherent interface for each outside connection
  173. if i > 0 {
  174. li = f.writers[i]
  175. } else {
  176. li = f.outside
  177. }
  178. lhh := f.lightHouse.NewRequestHandler()
  179. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  180. li.ListenOut(f.readOutsidePackets, lhh.HandleRequest, conntrackCache, i)
  181. }
  182. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  183. runtime.LockOSThread()
  184. packet := make([]byte, mtu)
  185. out := make([]byte, mtu)
  186. fwPacket := &firewall.Packet{}
  187. nb := make([]byte, 12, 12)
  188. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  189. for {
  190. n, err := reader.Read(packet)
  191. if err != nil {
  192. f.l.WithError(err).Error("Error while reading outbound packet")
  193. // This only seems to happen when something fatal happens to the fd, so exit.
  194. os.Exit(2)
  195. }
  196. f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get(f.l))
  197. }
  198. }
  199. func (f *Interface) RegisterConfigChangeCallbacks(c *config.C) {
  200. c.RegisterReloadCallback(f.reloadCA)
  201. c.RegisterReloadCallback(f.reloadCertKey)
  202. c.RegisterReloadCallback(f.reloadFirewall)
  203. for _, udpConn := range f.writers {
  204. c.RegisterReloadCallback(udpConn.ReloadConfig)
  205. }
  206. c.RegisterReloadCallback(f.reloadPSKs)
  207. }
  208. func (f *Interface) reloadCA(c *config.C) {
  209. // reload and check regardless
  210. // todo: need mutex?
  211. newCAs, err := loadCAFromConfig(f.l, c)
  212. if err != nil {
  213. f.l.WithError(err).Error("Could not refresh trusted CA certificates")
  214. return
  215. }
  216. f.caPool = newCAs
  217. f.l.WithField("fingerprints", f.caPool.GetFingerprints()).Info("Trusted CA certificates refreshed")
  218. }
  219. func (f *Interface) reloadCertKey(c *config.C) {
  220. // reload and check in all cases
  221. cs, err := NewCertStateFromConfig(c)
  222. if err != nil {
  223. f.l.WithError(err).Error("Could not refresh client cert")
  224. return
  225. }
  226. // did IP in cert change? if so, don't set
  227. oldIPs := f.certState.certificate.Details.Ips
  228. newIPs := cs.certificate.Details.Ips
  229. if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {
  230. f.l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")
  231. return
  232. }
  233. f.certState = cs
  234. f.l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")
  235. }
  236. func (f *Interface) reloadFirewall(c *config.C) {
  237. //TODO: need to trigger/detect if the certificate changed too
  238. if c.HasChanged("firewall") == false {
  239. f.l.Debug("No firewall config change detected")
  240. return
  241. }
  242. fw, err := NewFirewallFromConfig(f.l, f.certState.certificate, c)
  243. if err != nil {
  244. f.l.WithError(err).Error("Error while creating firewall during reload")
  245. return
  246. }
  247. oldFw := f.firewall
  248. conntrack := oldFw.Conntrack
  249. conntrack.Lock()
  250. defer conntrack.Unlock()
  251. fw.rulesVersion = oldFw.rulesVersion + 1
  252. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  253. // safe and just reset conntrack in this case.
  254. if fw.rulesVersion == 0 {
  255. f.l.WithField("firewallHash", fw.GetRuleHash()).
  256. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  257. WithField("rulesVersion", fw.rulesVersion).
  258. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  259. } else {
  260. fw.Conntrack = conntrack
  261. }
  262. f.firewall = fw
  263. oldFw.Destroy()
  264. f.l.WithField("firewallHash", fw.GetRuleHash()).
  265. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  266. WithField("rulesVersion", fw.rulesVersion).
  267. Info("New firewall has been installed")
  268. }
  269. func (f *Interface) reloadPSKs(c *config.C) {
  270. psk, err := NewPskFromConfig(c, f.myVpnIp)
  271. if err != nil {
  272. f.l.WithError(err).Error("Error while reloading PSKs")
  273. return
  274. }
  275. atomic.StorePointer((*unsafe.Pointer)(unsafe.Pointer(&f.psk)), unsafe.Pointer(psk))
  276. f.l.WithField("pskMode", psk.mode).WithField("keysLen", len(psk.Cache)).
  277. Info("New psks are in use")
  278. }
  279. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  280. ticker := time.NewTicker(i)
  281. defer ticker.Stop()
  282. udpStats := udp.NewUDPStatsEmitter(f.writers)
  283. for {
  284. select {
  285. case <-ctx.Done():
  286. return
  287. case <-ticker.C:
  288. f.firewall.EmitStats()
  289. f.handshakeManager.EmitStats()
  290. udpStats()
  291. }
  292. }
  293. }