interface.go 8.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322
  1. package nebula
  2. import (
  3. "context"
  4. "errors"
  5. "io"
  6. "net"
  7. "os"
  8. "runtime"
  9. "time"
  10. "github.com/rcrowley/go-metrics"
  11. "github.com/sirupsen/logrus"
  12. "github.com/slackhq/nebula/cert"
  13. )
  14. const mtu = 9001
  15. type Inside interface {
  16. io.ReadWriteCloser
  17. Activate() error
  18. CidrNet() *net.IPNet
  19. DeviceName() string
  20. WriteRaw([]byte) error
  21. NewMultiQueueReader() (io.ReadWriteCloser, error)
  22. }
  23. type InterfaceConfig struct {
  24. HostMap *HostMap
  25. Outside *udpConn
  26. Inside Inside
  27. certState *CertState
  28. Cipher string
  29. Firewall *Firewall
  30. ServeDns bool
  31. HandshakeManager *HandshakeManager
  32. lightHouse *LightHouse
  33. checkInterval int
  34. pendingDeletionInterval int
  35. DropLocalBroadcast bool
  36. DropMulticast bool
  37. UDPBatchSize int
  38. routines int
  39. MessageMetrics *MessageMetrics
  40. version string
  41. caPool *cert.NebulaCAPool
  42. disconnectInvalid bool
  43. ConntrackCacheTimeout time.Duration
  44. l *logrus.Logger
  45. }
  46. type Interface struct {
  47. hostMap *HostMap
  48. outside *udpConn
  49. inside Inside
  50. certState *CertState
  51. cipher string
  52. firewall *Firewall
  53. connectionManager *connectionManager
  54. handshakeManager *HandshakeManager
  55. serveDns bool
  56. createTime time.Time
  57. lightHouse *LightHouse
  58. localBroadcast uint32
  59. myVpnIp uint32
  60. dropLocalBroadcast bool
  61. dropMulticast bool
  62. udpBatchSize int
  63. routines int
  64. caPool *cert.NebulaCAPool
  65. disconnectInvalid bool
  66. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  67. rebindCount int8
  68. version string
  69. conntrackCacheTimeout time.Duration
  70. writers []*udpConn
  71. readers []io.ReadWriteCloser
  72. metricHandshakes metrics.Histogram
  73. messageMetrics *MessageMetrics
  74. cachedPacketMetrics *cachedPacketMetrics
  75. l *logrus.Logger
  76. }
  77. func NewInterface(ctx context.Context, c *InterfaceConfig) (*Interface, error) {
  78. if c.Outside == nil {
  79. return nil, errors.New("no outside connection")
  80. }
  81. if c.Inside == nil {
  82. return nil, errors.New("no inside interface (tun)")
  83. }
  84. if c.certState == nil {
  85. return nil, errors.New("no certificate state")
  86. }
  87. if c.Firewall == nil {
  88. return nil, errors.New("no firewall rules")
  89. }
  90. ifce := &Interface{
  91. hostMap: c.HostMap,
  92. outside: c.Outside,
  93. inside: c.Inside,
  94. certState: c.certState,
  95. cipher: c.Cipher,
  96. firewall: c.Firewall,
  97. serveDns: c.ServeDns,
  98. handshakeManager: c.HandshakeManager,
  99. createTime: time.Now(),
  100. lightHouse: c.lightHouse,
  101. localBroadcast: ip2int(c.certState.certificate.Details.Ips[0].IP) | ^ip2int(c.certState.certificate.Details.Ips[0].Mask),
  102. dropLocalBroadcast: c.DropLocalBroadcast,
  103. dropMulticast: c.DropMulticast,
  104. udpBatchSize: c.UDPBatchSize,
  105. routines: c.routines,
  106. version: c.version,
  107. writers: make([]*udpConn, c.routines),
  108. readers: make([]io.ReadWriteCloser, c.routines),
  109. caPool: c.caPool,
  110. disconnectInvalid: c.disconnectInvalid,
  111. myVpnIp: ip2int(c.certState.certificate.Details.Ips[0].IP),
  112. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  113. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  114. messageMetrics: c.MessageMetrics,
  115. cachedPacketMetrics: &cachedPacketMetrics{
  116. sent: metrics.GetOrRegisterCounter("hostinfo.cached_packets.sent", nil),
  117. dropped: metrics.GetOrRegisterCounter("hostinfo.cached_packets.dropped", nil),
  118. },
  119. l: c.l,
  120. }
  121. ifce.connectionManager = newConnectionManager(ctx, c.l, ifce, c.checkInterval, c.pendingDeletionInterval)
  122. return ifce, nil
  123. }
  124. // activate creates the interface on the host. After the interface is created, any
  125. // other services that want to bind listeners to its IP may do so successfully. However,
  126. // the interface isn't going to process anything until run() is called.
  127. func (f *Interface) activate() {
  128. // actually turn on tun dev
  129. addr, err := f.outside.LocalAddr()
  130. if err != nil {
  131. f.l.WithError(err).Error("Failed to get udp listen address")
  132. }
  133. f.l.WithField("interface", f.inside.DeviceName()).WithField("network", f.inside.CidrNet().String()).
  134. WithField("build", f.version).WithField("udpAddr", addr).
  135. Info("Nebula interface is active")
  136. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  137. // Prepare n tun queues
  138. var reader io.ReadWriteCloser = f.inside
  139. for i := 0; i < f.routines; i++ {
  140. if i > 0 {
  141. reader, err = f.inside.NewMultiQueueReader()
  142. if err != nil {
  143. f.l.Fatal(err)
  144. }
  145. }
  146. f.readers[i] = reader
  147. }
  148. if err := f.inside.Activate(); err != nil {
  149. f.l.Fatal(err)
  150. }
  151. }
  152. func (f *Interface) run() {
  153. // Launch n queues to read packets from udp
  154. for i := 0; i < f.routines; i++ {
  155. go f.listenOut(i)
  156. }
  157. // Launch n queues to read packets from tun dev
  158. for i := 0; i < f.routines; i++ {
  159. go f.listenIn(f.readers[i], i)
  160. }
  161. }
  162. func (f *Interface) listenOut(i int) {
  163. runtime.LockOSThread()
  164. var li *udpConn
  165. // TODO clean this up with a coherent interface for each outside connection
  166. if i > 0 {
  167. li = f.writers[i]
  168. } else {
  169. li = f.outside
  170. }
  171. li.ListenOut(f, i)
  172. }
  173. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  174. runtime.LockOSThread()
  175. packet := make([]byte, mtu)
  176. out := make([]byte, mtu)
  177. fwPacket := &FirewallPacket{}
  178. nb := make([]byte, 12, 12)
  179. conntrackCache := NewConntrackCacheTicker(f.conntrackCacheTimeout)
  180. for {
  181. n, err := reader.Read(packet)
  182. if err != nil {
  183. f.l.WithError(err).Error("Error while reading outbound packet")
  184. // This only seems to happen when something fatal happens to the fd, so exit.
  185. os.Exit(2)
  186. }
  187. f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get(f.l))
  188. }
  189. }
  190. func (f *Interface) RegisterConfigChangeCallbacks(c *Config) {
  191. c.RegisterReloadCallback(f.reloadCA)
  192. c.RegisterReloadCallback(f.reloadCertKey)
  193. c.RegisterReloadCallback(f.reloadFirewall)
  194. for _, udpConn := range f.writers {
  195. c.RegisterReloadCallback(udpConn.reloadConfig)
  196. }
  197. }
  198. func (f *Interface) reloadCA(c *Config) {
  199. // reload and check regardless
  200. // todo: need mutex?
  201. newCAs, err := loadCAFromConfig(f.l, c)
  202. if err != nil {
  203. f.l.WithError(err).Error("Could not refresh trusted CA certificates")
  204. return
  205. }
  206. f.caPool = newCAs
  207. f.l.WithField("fingerprints", f.caPool.GetFingerprints()).Info("Trusted CA certificates refreshed")
  208. }
  209. func (f *Interface) reloadCertKey(c *Config) {
  210. // reload and check in all cases
  211. cs, err := NewCertStateFromConfig(c)
  212. if err != nil {
  213. f.l.WithError(err).Error("Could not refresh client cert")
  214. return
  215. }
  216. // did IP in cert change? if so, don't set
  217. oldIPs := f.certState.certificate.Details.Ips
  218. newIPs := cs.certificate.Details.Ips
  219. if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {
  220. f.l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")
  221. return
  222. }
  223. f.certState = cs
  224. f.l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")
  225. }
  226. func (f *Interface) reloadFirewall(c *Config) {
  227. //TODO: need to trigger/detect if the certificate changed too
  228. if c.HasChanged("firewall") == false {
  229. f.l.Debug("No firewall config change detected")
  230. return
  231. }
  232. fw, err := NewFirewallFromConfig(f.l, f.certState.certificate, c)
  233. if err != nil {
  234. f.l.WithError(err).Error("Error while creating firewall during reload")
  235. return
  236. }
  237. oldFw := f.firewall
  238. conntrack := oldFw.Conntrack
  239. conntrack.Lock()
  240. defer conntrack.Unlock()
  241. fw.rulesVersion = oldFw.rulesVersion + 1
  242. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  243. // safe and just reset conntrack in this case.
  244. if fw.rulesVersion == 0 {
  245. f.l.WithField("firewallHash", fw.GetRuleHash()).
  246. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  247. WithField("rulesVersion", fw.rulesVersion).
  248. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  249. } else {
  250. fw.Conntrack = conntrack
  251. }
  252. f.firewall = fw
  253. oldFw.Destroy()
  254. f.l.WithField("firewallHash", fw.GetRuleHash()).
  255. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  256. WithField("rulesVersion", fw.rulesVersion).
  257. Info("New firewall has been installed")
  258. }
  259. func (f *Interface) emitStats(ctx context.Context, i time.Duration) {
  260. ticker := time.NewTicker(i)
  261. defer ticker.Stop()
  262. udpStats := NewUDPStatsEmitter(f.writers)
  263. for {
  264. select {
  265. case <-ctx.Done():
  266. return
  267. case <-ticker.C:
  268. f.firewall.EmitStats()
  269. f.handshakeManager.EmitStats()
  270. udpStats()
  271. }
  272. }
  273. }