| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291 | package nebulaimport (	"errors"	"io"	"net"	"os"	"runtime"	"time"	"github.com/rcrowley/go-metrics")const mtu = 9001type Inside interface {	io.ReadWriteCloser	Activate() error	CidrNet() *net.IPNet	DeviceName() string	WriteRaw([]byte) error	NewMultiQueueReader() (io.ReadWriteCloser, error)}type InterfaceConfig struct {	HostMap                 *HostMap	Outside                 *udpConn	Inside                  Inside	certState               *CertState	Cipher                  string	Firewall                *Firewall	ServeDns                bool	HandshakeManager        *HandshakeManager	lightHouse              *LightHouse	checkInterval           int	pendingDeletionInterval int	DropLocalBroadcast      bool	DropMulticast           bool	UDPBatchSize            int	routines                int	MessageMetrics          *MessageMetrics	version                 string	ConntrackCacheTimeout time.Duration}type Interface struct {	hostMap            *HostMap	outside            *udpConn	inside             Inside	certState          *CertState	cipher             string	firewall           *Firewall	connectionManager  *connectionManager	handshakeManager   *HandshakeManager	serveDns           bool	createTime         time.Time	lightHouse         *LightHouse	localBroadcast     uint32	dropLocalBroadcast bool	dropMulticast      bool	udpBatchSize       int	routines           int	// rebindCount is used to decide if an active tunnel should trigger a punch notification through a lighthouse	rebindCount int8	version     string	conntrackCacheTimeout time.Duration	writers []*udpConn	readers []io.ReadWriteCloser	metricHandshakes metrics.Histogram	messageMetrics   *MessageMetrics}func NewInterface(c *InterfaceConfig) (*Interface, error) {	if c.Outside == nil {		return nil, errors.New("no outside connection")	}	if c.Inside == nil {		return nil, errors.New("no inside interface (tun)")	}	if c.certState == nil {		return nil, errors.New("no certificate state")	}	if c.Firewall == nil {		return nil, errors.New("no firewall rules")	}	ifce := &Interface{		hostMap:            c.HostMap,		outside:            c.Outside,		inside:             c.Inside,		certState:          c.certState,		cipher:             c.Cipher,		firewall:           c.Firewall,		serveDns:           c.ServeDns,		handshakeManager:   c.HandshakeManager,		createTime:         time.Now(),		lightHouse:         c.lightHouse,		localBroadcast:     ip2int(c.certState.certificate.Details.Ips[0].IP) | ^ip2int(c.certState.certificate.Details.Ips[0].Mask),		dropLocalBroadcast: c.DropLocalBroadcast,		dropMulticast:      c.DropMulticast,		udpBatchSize:       c.UDPBatchSize,		routines:           c.routines,		version:            c.version,		writers:            make([]*udpConn, c.routines),		readers:            make([]io.ReadWriteCloser, c.routines),		conntrackCacheTimeout: c.ConntrackCacheTimeout,		metricHandshakes: metrics.GetOrRegisterHistogram("handshakes", nil, metrics.NewExpDecaySample(1028, 0.015)),		messageMetrics:   c.MessageMetrics,	}	ifce.connectionManager = newConnectionManager(ifce, c.checkInterval, c.pendingDeletionInterval)	return ifce, nil}func (f *Interface) run() {	// actually turn on tun dev	addr, err := f.outside.LocalAddr()	if err != nil {		l.WithError(err).Error("Failed to get udp listen address")	}	l.WithField("interface", f.inside.DeviceName()).WithField("network", f.inside.CidrNet().String()).		WithField("build", f.version).WithField("udpAddr", addr).		Info("Nebula interface is active")	metrics.GetOrRegisterGauge("routines", nil).Update(int64(f.routines))	// Prepare n tun queues	var reader io.ReadWriteCloser = f.inside	for i := 0; i < f.routines; i++ {		if i > 0 {			reader, err = f.inside.NewMultiQueueReader()			if err != nil {				l.Fatal(err)			}		}		f.readers[i] = reader	}	if err := f.inside.Activate(); err != nil {		l.Fatal(err)	}	// Launch n queues to read packets from udp	for i := 0; i < f.routines; i++ {		go f.listenOut(i)	}	// Launch n queues to read packets from tun dev	for i := 0; i < f.routines; i++ {		go f.listenIn(f.readers[i], i)	}}func (f *Interface) listenOut(i int) {	runtime.LockOSThread()	var li *udpConn	// TODO clean this up with a coherent interface for each outside connection	if i > 0 {		li = f.writers[i]	} else {		li = f.outside	}	li.ListenOut(f, i)}func (f *Interface) listenIn(reader io.ReadWriteCloser, i int) {	runtime.LockOSThread()	packet := make([]byte, mtu)	out := make([]byte, mtu)	fwPacket := &FirewallPacket{}	nb := make([]byte, 12, 12)	conntrackCache := NewConntrackCacheTicker(f.conntrackCacheTimeout)	for {		n, err := reader.Read(packet)		if err != nil {			l.WithError(err).Error("Error while reading outbound packet")			// This only seems to happen when something fatal happens to the fd, so exit.			os.Exit(2)		}		f.consumeInsidePacket(packet[:n], fwPacket, nb, out, i, conntrackCache.Get())	}}func (f *Interface) RegisterConfigChangeCallbacks(c *Config) {	c.RegisterReloadCallback(f.reloadCA)	c.RegisterReloadCallback(f.reloadCertKey)	c.RegisterReloadCallback(f.reloadFirewall)	for _, udpConn := range f.writers {		c.RegisterReloadCallback(udpConn.reloadConfig)	}}func (f *Interface) reloadCA(c *Config) {	// reload and check regardless	// todo: need mutex?	newCAs, err := loadCAFromConfig(c)	if err != nil {		l.WithError(err).Error("Could not refresh trusted CA certificates")		return	}	trustedCAs = newCAs	l.WithField("fingerprints", trustedCAs.GetFingerprints()).Info("Trusted CA certificates refreshed")}func (f *Interface) reloadCertKey(c *Config) {	// reload and check in all cases	cs, err := NewCertStateFromConfig(c)	if err != nil {		l.WithError(err).Error("Could not refresh client cert")		return	}	// did IP in cert change? if so, don't set	oldIPs := f.certState.certificate.Details.Ips	newIPs := cs.certificate.Details.Ips	if len(oldIPs) > 0 && len(newIPs) > 0 && oldIPs[0].String() != newIPs[0].String() {		l.WithField("new_ip", newIPs[0]).WithField("old_ip", oldIPs[0]).Error("IP in new cert was different from old")		return	}	f.certState = cs	l.WithField("cert", cs.certificate).Info("Client cert refreshed from disk")}func (f *Interface) reloadFirewall(c *Config) {	//TODO: need to trigger/detect if the certificate changed too	if c.HasChanged("firewall") == false {		l.Debug("No firewall config change detected")		return	}	fw, err := NewFirewallFromConfig(f.certState.certificate, c)	if err != nil {		l.WithError(err).Error("Error while creating firewall during reload")		return	}	oldFw := f.firewall	conntrack := oldFw.Conntrack	conntrack.Lock()	defer conntrack.Unlock()	fw.rulesVersion = oldFw.rulesVersion + 1	// If rulesVersion is back to zero, we have wrapped all the way around. Be	// safe and just reset conntrack in this case.	if fw.rulesVersion == 0 {		l.WithField("firewallHash", fw.GetRuleHash()).			WithField("oldFirewallHash", oldFw.GetRuleHash()).			WithField("rulesVersion", fw.rulesVersion).			Warn("firewall rulesVersion has overflowed, resetting conntrack")	} else {		fw.Conntrack = conntrack	}	f.firewall = fw	oldFw.Destroy()	l.WithField("firewallHash", fw.GetRuleHash()).		WithField("oldFirewallHash", oldFw.GetRuleHash()).		WithField("rulesVersion", fw.rulesVersion).		Info("New firewall has been installed")}func (f *Interface) emitStats(i time.Duration) {	ticker := time.NewTicker(i)	udpStats := NewUDPStatsEmitter(f.writers)	for range ticker.C {		f.firewall.EmitStats()		f.handshakeManager.EmitStats()		udpStats()	}}
 |