interface.go 7.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291
  1. package nebula
  2. import (
  3. "errors"
  4. "io"
  5. "net"
  6. "os"
  7. "runtime"
  8. "time"
  9. "github.com/rcrowley/go-metrics"
  10. )
  11. const mtu = 9001
  12. type Inside interface {
  13. io.ReadWriteCloser
  14. Activate() error
  15. CidrNet() *net.IPNet
  16. DeviceName() string
  17. WriteRaw([]byte) error
  18. NewMultiQueueReader() (io.ReadWriteCloser, error)
  19. }
  20. type InterfaceConfig struct {
  21. HostMap *HostMap
  22. Outside *udpConn
  23. Inside Inside
  24. certState *CertState
  25. Cipher string
  26. Firewall *Firewall
  27. ServeDns bool
  28. HandshakeManager *HandshakeManager
  29. lightHouse *LightHouse
  30. checkInterval int
  31. pendingDeletionInterval int
  32. DropLocalBroadcast bool
  33. DropMulticast bool
  34. UDPBatchSize int
  35. routines int
  36. MessageMetrics *MessageMetrics
  37. version string
  38. ConntrackCacheTimeout time.Duration
  39. }
  40. type Interface struct {
  41. hostMap *HostMap
  42. outside *udpConn
  43. inside Inside
  44. certState *CertState
  45. cipher string
  46. firewall *Firewall
  47. connectionManager *connectionManager
  48. handshakeManager *HandshakeManager
  49. serveDns bool
  50. createTime time.Time
  51. lightHouse *LightHouse
  52. localBroadcast uint32
  53. dropLocalBroadcast bool
  54. dropMulticast bool
  55. udpBatchSize int
  56. routines int
  57. // rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse
  58. rebindCount int8
  59. version string
  60. conntrackCacheTimeout time.Duration
  61. writers []*udpConn
  62. readers []io.ReadWriteCloser
  63. metricHandshakes metrics.Histogram
  64. messageMetrics *MessageMetrics
  65. }
  66. func NewInterface(c *InterfaceConfig) (*Interface, error) {
  67. if c.Outside == nil {
  68. return nil, errors.New("no outside connection")
  69. }
  70. if c.Inside == nil {
  71. return nil, errors.New("no inside interface (tun)")
  72. }
  73. if c.certState == nil {
  74. return nil, errors.New("no certificate state")
  75. }
  76. if c.Firewall == nil {
  77. return nil, errors.New("no firewall rules")
  78. }
  79. ifce := &Interface{
  80. hostMap: c.HostMap,
  81. outside: c.Outside,
  82. inside: c.Inside,
  83. certState: c.certState,
  84. cipher: c.Cipher,
  85. firewall: c.Firewall,
  86. serveDns: c.ServeDns,
  87. handshakeManager: c.HandshakeManager,
  88. createTime: time.Now(),
  89. lightHouse: c.lightHouse,
  90. localBroadcast: ip2int(c.certState.certificate.Details.Ips[0].IP) | ^ip2int(c.certState.certificate.Details.Ips[0].Mask),
  91. dropLocalBroadcast: c.DropLocalBroadcast,
  92. dropMulticast: c.DropMulticast,
  93. udpBatchSize: c.UDPBatchSize,
  94. routines: c.routines,
  95. version: c.version,
  96. writers: make([]*udpConn, c.routines),
  97. readers: make([]io.ReadWriteCloser, c.routines),
  98. conntrackCacheTimeout: c.ConntrackCacheTimeout,
  99. metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),
  100. messageMetrics: c.MessageMetrics,
  101. }
  102. ifce.connectionManager = newConnectionManager(ifce, c.checkInterval, c.pendingDeletionInterval)
  103. return ifce, nil
  104. }
  105. func (f *Interface) run() {
  106. // actually turn on tun dev
  107. addr, err := f.outside.LocalAddr()
  108. if err != nil {
  109. l.WithError(err).Error("Failed to get udp listen address")
  110. }
  111. l.WithField("interface", f.inside.DeviceName()).WithField("network", f.inside.CidrNet().String()).
  112. WithField("build", f.version).WithField("udpAddr", addr).
  113. Info("Nebula interface is active")
  114. metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))
  115. // Prepare n tun queues
  116. var reader io.ReadWriteCloser = f.inside
  117. for i := 0; i < f.routines; i++ {
  118. if i > 0 {
  119. reader, err = f.inside.NewMultiQueueReader()
  120. if err != nil {
  121. l.Fatal(err)
  122. }
  123. }
  124. f.readers[i] = reader
  125. }
  126. if err := f.inside.Activate(); err != nil {
  127. l.Fatal(err)
  128. }
  129. // Launch n queues to read packets from udp
  130. for i := 0; i < f.routines; i++ {
  131. go f.listenOut(i)
  132. }
  133. // Launch n queues to read packets from tun dev
  134. for i := 0; i < f.routines; i++ {
  135. go f.listenIn(f.readers[i], i)
  136. }
  137. }
  138. func (f *Interface) listenOut(i int) {
  139. runtime.LockOSThread()
  140. var li *udpConn
  141. // TODO clean this up with a coherent interface for each outside connection
  142. if i > 0 {
  143. li = f.writers[i]
  144. } else {
  145. li = f.outside
  146. }
  147. li.ListenOut(f, i)
  148. }
  149. func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {
  150. runtime.LockOSThread()
  151. packet := make([]byte, mtu)
  152. out := make([]byte, mtu)
  153. fwPacket := &FirewallPacket{}
  154. nb := make([]byte, 12, 12)
  155. conntrackCache := NewConntrackCacheTicker(f.conntrackCacheTimeout)
  156. for {
  157. n, err := reader.Read(packet)
  158. if err != nil {
  159. l.WithError(err).Error("Error while reading outbound packet")
  160. // This only seems to happen when something fatal happens to the fd, so exit.
  161. os.Exit(2)
  162. }
  163. f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get())
  164. }
  165. }
  166. func (f *Interface) RegisterConfigChangeCallbacks(c *Config) {
  167. c.RegisterReloadCallback(f.reloadCA)
  168. c.RegisterReloadCallback(f.reloadCertKey)
  169. c.RegisterReloadCallback(f.reloadFirewall)
  170. for _, udpConn := range f.writers {
  171. c.RegisterReloadCallback(udpConn.reloadConfig)
  172. }
  173. }
  174. func (f *Interface) reloadCA(c *Config) {
  175. // reload and check regardless
  176. // todo: need mutex?
  177. newCAs, err := loadCAFromConfig(c)
  178. if err != nil {
  179. l.WithError(err).Error("Could not refresh trusted CA certificates")
  180. return
  181. }
  182. trustedCAs = newCAs
  183. l.WithField("fingerprints", trustedCAs.GetFingerprints()).Info("Trusted CA certificates refreshed")
  184. }
  185. func (f *Interface) reloadCertKey(c *Config) {
  186. // reload and check in all cases
  187. cs, err := NewCertStateFromConfig(c)
  188. if err != nil {
  189. l.WithError(err).Error("Could not refresh client cert")
  190. return
  191. }
  192. // did IP in cert change? if so, don't set
  193. oldIPs := f.certState.certificate.Details.Ips
  194. newIPs := cs.certificate.Details.Ips
  195. if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {
  196. l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")
  197. return
  198. }
  199. f.certState = cs
  200. l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")
  201. }
  202. func (f *Interface) reloadFirewall(c *Config) {
  203. //TODO: need to trigger/detect if the certificate changed too
  204. if c.HasChanged("firewall") == false {
  205. l.Debug("No firewall config change detected")
  206. return
  207. }
  208. fw, err := NewFirewallFromConfig(f.certState.certificate, c)
  209. if err != nil {
  210. l.WithError(err).Error("Error while creating firewall during reload")
  211. return
  212. }
  213. oldFw := f.firewall
  214. conntrack := oldFw.Conntrack
  215. conntrack.Lock()
  216. defer conntrack.Unlock()
  217. fw.rulesVersion = oldFw.rulesVersion + 1
  218. // If rulesVersion is back to zero, we have wrapped all the way around. Be
  219. // safe and just reset conntrack in this case.
  220. if fw.rulesVersion == 0 {
  221. l.WithField("firewallHash", fw.GetRuleHash()).
  222. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  223. WithField("rulesVersion", fw.rulesVersion).
  224. Warn("firewall rulesVersion has overflowed, resetting conntrack")
  225. } else {
  226. fw.Conntrack = conntrack
  227. }
  228. f.firewall = fw
  229. oldFw.Destroy()
  230. l.WithField("firewallHash", fw.GetRuleHash()).
  231. WithField("oldFirewallHash", oldFw.GetRuleHash()).
  232. WithField("rulesVersion", fw.rulesVersion).
  233. Info("New firewall has been installed")
  234. }
  235. func (f *Interface) emitStats(i time.Duration) {
  236. ticker := time.NewTicker(i)
  237. udpStats := NewUDPStatsEmitter(f.writers)
  238. for range ticker.C {
  239. f.firewall.EmitStats()
  240. f.handshakeManager.EmitStats()
  241. udpStats()
  242. }
  243. }