interface.go 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "io"
  6. "net"
  7. "os"
  8. "runtime"
  9. "time"
  10. "github.com/rcrowley/go-metrics"
  11. "github.com/sirupsen/logrus"
  12. "github.com/slackhq/nebula/cert"
  13. "github.com/slackhq/nebula/config"
  14. "github.com/slackhq/nebula/firewall"
  15. "github.com/slackhq/nebula/iputil"
  16. "github.com/slackhq/nebula/udp"
  17. )
  // mtu is the size, in bytes, of the packet and output buffers that listenIn
  // allocates for every tun reader.
  // NOTE(review): presumably the largest MTU the tun device is expected to
  // carry — confirm against the tun configuration.
  const mtu = 9001
  // Inside is the contract Interface requires from the inside (tun) device.
  // The device itself is used as the reader for the first routine; further
  // routines obtain their own reader through NewMultiQueueReader.
  type Inside interface {
  	// Read, Write and Close operate on the device itself.
  	io.ReadWriteCloser
  	// Activate is called once by Interface.activate, after all readers have
  	// been prepared.
  	Activate() error
  	// CidrNet is logged as the "network" field when the interface activates.
  	CidrNet() *net.IPNet
  	// DeviceName is logged as the "interface" field when the interface
  	// activates.
  	DeviceName() string
  	// WriteRaw is not called in the code visible here.
  	// NOTE(review): presumably writes a packet to the device without further
  	// processing — confirm against the implementations.
  	WriteRaw([]byte) error
  	// NewMultiQueueReader is called by Interface.activate once for every
  	// routine beyond the first to obtain an additional reader.
  	NewMultiQueueReader() (io.ReadWriteCloser, error)
  }
  // InterfaceConfig carries the dependencies and settings that NewInterface
  // copies into a new Interface.
  //
  // Outside, Inside, certState and Firewall are mandatory: NewInterface returns
  // an error when any of them is nil.
  type InterfaceConfig struct {
  	HostMap *HostMap
  	// Outside is the udp connection used by the first routine.
  	Outside *udp.Conn
  	// Inside is the tun device packets are read from.
  	Inside Inside
  	// certState supplies the certificate whose first IP becomes the local
  	// VPN address.
  	certState        *CertState
  	Cipher           string
  	Firewall         *Firewall
  	ServeDns         bool
  	HandshakeManager *HandshakeManager
  	lightHouse       *LightHouse
  	// checkInterval and pendingDeletionInterval are handed to
  	// newConnectionManager unchanged.
  	// NOTE(review): units are not visible here — presumably seconds; confirm.
  	checkInterval           int
  	pendingDeletionInterval int
  	DropLocalBroadcast      bool
  	DropMulticast           bool
  	// routines is the number of listenOut and listenIn goroutines that
  	// Interface.run starts; it also sizes the writers and readers slices.
  	routines       int
  	MessageMetrics *MessageMetrics
  	// version is logged as the "build" field when the interface activates.
  	version           string
  	caPool            *cert.NebulaCAPool
  	disconnectInvalid bool
  	// ConntrackCacheTimeout is passed to firewall.NewConntrackCacheTicker by
  	// every listener goroutine.
  	ConntrackCacheTimeout time.Duration
  	l                     *logrus.Logger
  }
  // Interface ties the outside udp connection(s) to the inside tun device and
  // holds the shared state (certificates, firewall, host map, metrics) used
  // while moving packets between them. It is built by NewInterface, brought up
  // by activate and started by run.
  type Interface struct {
  	hostMap *HostMap
  	// outside is the udp connection used by routine 0; other routines use
  	// writers[i].
  	outside *udp.Conn
  	// inside is the tun device; it doubles as the reader for routine 0.
  	inside Inside
  	// certState is replaced by reloadCertKey on config reload.
  	certState *CertState
  	cipher    string
  	// firewall is replaced by reloadFirewall on config reload.
  	firewall *Firewall
  	// connectionManager is created by NewInterface via newConnectionManager.
  	connectionManager *connectionManager
  	handshakeManager  *HandshakeManager
  	serveDns          bool
  	// createTime is set to time.Now() when NewInterface runs.
  	createTime time.Time
  	lightHouse *LightHouse
  	// localBroadcast is myVpnIp with every host bit of the certificate's
  	// network mask set.
  	localBroadcast iputil.VpnIp
  	// myVpnIp is derived from the first IP listed in the certificate.
  	myVpnIp            iputil.VpnIp
  	dropLocalBroadcast bool
  	dropMulticast      bool
  	// routines is the number of listenOut and listenIn goroutines run starts.
  	routines int
  	// caPool is replaced by reloadCA on config reload.
  	caPool            *cert.NebulaCAPool
  	disconnectInvalid bool
  	// rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  	rebindCount int8
  	// version is logged as the "build" field by activate.
  	version               string
  	conntrackCacheTimeout time.Duration
  	// writers holds one udp connection slot per routine. NewInterface only
  	// allocates the slice; the entries are filled in elsewhere.
  	writers []*udp.Conn
  	// readers holds one tun reader per routine and is filled by activate.
  	readers []io.ReadWriteCloser
  	// metricHandshakes is the histogram registered under "handshakes".
  	metricHandshakes metrics.Histogram
  	messageMetrics   *MessageMetrics
  	// cachedPacketMetrics holds the "hostinfo.cached_packets.*" counters.
  	cachedPacketMetrics *cachedPacketMetrics
  	l                   *logrus.Logger
  }
  79. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  80. if c.Outside == nil {
  81. return nil, errors.New("no outside connection")
  82. }
  83. if c.Inside == nil {
  84. return nil, errors.New("no inside interface (tun)")
  85. }
  86. if c.certState == nil {
  87. return nil, errors.New("no certificate state")
  88. }
  89. if c.Firewall == nil {
  90. return nil, errors.New("no firewall rules")
  91. }
  92. myVpnIp := iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].IP)
  93. ifce := &Interface{
  94. hostMap: c.HostMap,
  95. outside: c.Outside,
  96. inside: c.Inside,
  97. certState: c.certState,
  98. cipher: c.Cipher,
  99. firewall: c.Firewall,
  100. serveDns: c.ServeDns,
  101. handshakeManager: c.HandshakeManager,
  102. createTime: time.Now(),
  103. lightHouse: c.lightHouse,
  104. localBroadcast: myVpnIp | ^iputil.Ip2VpnIp(c.certState.certificate.Details.Ips[0].Mask),
  105. dropLocalBroadcast: c.DropLocalBroadcast,
  106. dropMulticast: c.DropMulticast,
  107. routines: c.routines,
  108. version: c.version,
  109. writers: make([]*udp.Conn, c.routines),
  110. readers: make([]io.ReadWriteCloser, c.routines),
  111. caPool: c.caPool,
  112. disconnectInvalid: c.disconnectInvalid,
  113. myVpnIp: myVpnIp,
  114. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  115. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  116. messageMetrics: c.MessageMetrics,
  117. cachedPacketMetrics: &cachedPacketMetrics{
  118. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  119. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  120. },
  121. l: c.l,
  122. }
  123. ifce.connectionManager = newConnectionManager(ctx, c.l, ifce, c.checkInterval, c.pendingDeletionInterval)
  124. return ifce, nil
  125. }
  126. // activate creates the interface on the host. After the interface is created, any
  127. // other services that want to bind listeners to its IP may do so successfully. However,
  128. // the interface isn't going to process anything until run() is called.
  129. func (f *Interface) activate() {
  130. // actually turn on tun dev
  131. addr, err := f.outside.LocalAddr()
  132. if err != nil {
  133. f.l.WithError(err).Error("Failed to get udp listen address")
  134. }
  135. f.l.WithField("interface", f.inside.DeviceName()).WithField("network", f.inside.CidrNet().String()).
  136. WithField("build", f.version).WithField("udpAddr", addr).
  137. Info("Nebula interface is active")
  138. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  139. // Prepare n tun queues
  140. var reader io.ReadWriteCloser = f.inside
  141. for i := 0; i < f.routines; i++ {
  142. if i > 0 {
  143. reader, err = f.inside.NewMultiQueueReader()
  144. if err != nil {
  145. f.l.Fatal(err)
  146. }
  147. }
  148. f.readers[i] = reader
  149. }
  150. if err := f.inside.Activate(); err != nil {
  151. f.l.Fatal(err)
  152. }
  153. }
  154. func (f *Interface) run() {
  155. // Launch n queues to read packets from udp
  156. for i := 0; i < f.routines; i++ {
  157. go f.listenOut(i)
  158. }
  159. // Launch n queues to read packets from tun dev
  160. for i := 0; i < f.routines; i++ {
  161. go f.listenIn(f.readers[i], i)
  162. }
  163. }
  164. func (f *Interface) listenOut(i int) {
  165. runtime.LockOSThread()
  166. var li *udp.Conn
  167. // TODO clean this up with a coherent interface for each outside connection
  168. if i > 0 {
  169. li = f.writers[i]
  170. } else {
  171. li = f.outside
  172. }
  173. lhh := f.lightHouse.NewRequestHandler()
  174. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  175. li.ListenOut(f.readOutsidePackets, lhh.HandleRequest, conntrackCache, i)
  176. }
  177. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  178. runtime.LockOSThread()
  179. packet := make([]byte, mtu)
  180. out := make([]byte, mtu)
  181. fwPacket := &firewall.Packet{}
  182. nb := make([]byte, 12, 12)
  183. conntrackCache := firewall.NewConntrackCacheTicker(f.conntrackCacheTimeout)
  184. for {
  185. n, err := reader.Read(packet)
  186. if err != nil {
  187. f.l.WithError(err).Error("Error while reading outbound packet")
  188. // This only seems to happen when something fatal happens to the fd, so exit.
  189. os.Exit(2)
  190. }
  191. f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get(f.l))
  192. }
  193. }
  194. func (f *Interface) RegisterConfigChangeCallbacks(c *config.C) {
  195. c.RegisterReloadCallback(f.reloadCA)
  196. c.RegisterReloadCallback(f.reloadCertKey)
  197. c.RegisterReloadCallback(f.reloadFirewall)
  198. for _, udpConn := range f.writers {
  199. c.RegisterReloadCallback(udpConn.ReloadConfig)
  200. }
  201. }
  202. func (f *Interface) reloadCA(c *config.C) {
  203. // reload and check regardless
  204. // todo: need mutex?
  205. newCAs, err := loadCAFromConfig(f.l, c)
  206. if err != nil {
  207. f.l.WithError(err).Error("Could not refresh trusted CA certificates")
  208. return
  209. }
  210. f.caPool = newCAs
  211. f.l.WithField("fingerprints", f.caPool.GetFingerprints()).Info("Trusted CA certificates refreshed")
  212. }
  213. func (f *Interface) reloadCertKey(c *config.C) {
  214. // reload and check in all cases
  215. cs, err := NewCertStateFromConfig(c)
  216. if err != nil {
  217. f.l.WithError(err).Error("Could not refresh client cert")
  218. return
  219. }
  220. // did IP in cert change? if so, don't set
  221. oldIPs := f.certState.certificate.Details.Ips
  222. newIPs := cs.certificate.Details.Ips
  223. if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {
  224. f.l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")
  225. return
  226. }
  227. f.certState = cs
  228. f.l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")
  229. }
  230. func (f *Interface) reloadFirewall(c *config.C) {
  231. //TODO: need to trigger/detect if the certificate changed too
  232. if c.HasChanged("firewall") == false {
  233. f.l.Debug("No firewall config change detected")
  234. return
  235. }
  236. fw, err := NewFirewallFromConfig(f.l, f.certState.certificate, c)
  237. if err != nil {
  238. f.l.WithError(err).Error("Error while creating firewall during reload")
  239. return
  240. }
  241. oldFw := f.firewall
  242. conntrack := oldFw.Conntrack
  243. conntrack.Lock()
  244. defer conntrack.Unlock()
  245. fw.rulesVersion = oldFw.rulesVersion + 1
  246. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  247. // safe and just reset conntrack in this case.
  248. if fw.rulesVersion == 0 {
  249. f.l.WithField("firewallHash", fw.GetRuleHash()).
  250. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  251. WithField("rulesVersion", fw.rulesVersion).
  252. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  253. } else {
  254. fw.Conntrack = conntrack
  255. }
  256. f.firewall = fw
  257. oldFw.Destroy()
  258. f.l.WithField("firewallHash", fw.GetRuleHash()).
  259. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  260. WithField("rulesVersion", fw.rulesVersion).
  261. Info("New firewall has been installed")
  262. }
  263. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  264. ticker := time.NewTicker(i)
  265. defer ticker.Stop()
  266. udpStats := udp.NewUDPStatsEmitter(f.writers)
  267. for {
  268. select {
  269. case <-ctx.Done():
  270. return
  271. case <-ticker.C:
  272. f.firewall.EmitStats()
  273. f.handshakeManager.EmitStats()
  274. udpStats()
  275. }
  276. }
  277. }