123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643 |
- //go:build !e2e_testing
- // +build !e2e_testing
- package overlay
- import (
- "bytes"
- "errors"
- "fmt"
- "io"
- "io/fs"
- "net/netip"
- "sync/atomic"
- "syscall"
- "time"
- "unsafe"
- "github.com/gaissmai/bart"
- "github.com/sirupsen/logrus"
- "github.com/slackhq/nebula/config"
- "github.com/slackhq/nebula/routing"
- "github.com/slackhq/nebula/util"
- netroute "golang.org/x/net/route"
- "golang.org/x/sys/unix"
- )
// ioctl request numbers and flag values used by this file to configure the
// tun device.
const (
	// FIODGNAME is defined in sys/sys/filio.h on FreeBSD. newTun uses it to
	// read the name of the interface behind the opened device.
	// For 32-bit systems, use FIODGNAME_32 (not defined in this file: 0x80086678)
	FIODGNAME = 0x80106678

	// TUNSIFMODE is the ioctl newTun issues to set the broadcast and
	// multicast interface flags.
	TUNSIFMODE = 0x8004745e

	// TUNSIFHEAD is the ioctl newTun issues to turn on the 4-byte address
	// family header that Read and Write handle.
	TUNSIFHEAD = 0x80047460

	// OSIOCAIFADDR_IN6 is the ioctl addIp issues to assign an IPv6 address.
	OSIOCAIFADDR_IN6 = 0x8088691b

	// IN6_IFF_NODAD is the flag addIp sets on the IPv6 addresses it assigns.
	IN6_IFF_NODAD = 0x0020
)
// fiodgnameArg is the argument newTun passes to the FIODGNAME ioctl to read
// the interface name of an opened tun device.
type fiodgnameArg struct {
	// length is the size in bytes of the buffer behind buf.
	length int32
	// pad presumably keeps buf at the offset the 64-bit kernel layout
	// expects - TODO confirm against sys/sys/filio.h.
	pad [4]byte
	// buf points at the buffer that receives the name.
	buf unsafe.Pointer
}
- type ifreqRename struct {
- Name [unix.IFNAMSIZ]byte
- Data uintptr
- }
- type ifreqDestroy struct {
- Name [unix.IFNAMSIZ]byte
- pad [16]byte
- }
- type ifReq struct {
- Name [unix.IFNAMSIZ]byte
- Flags uint16
- }
- type ifreqMTU struct {
- Name [unix.IFNAMSIZ]byte
- MTU int32
- }
// addrLifetime is the lifetime section of ifreqAlias6. addIp leaves Expire
// and Preferred at zero and sets Vltime and Pltime to 0xffffffff (presumably
// "never expires" - TODO confirm against netinet6/in6_var.h).
type addrLifetime struct {
	Expire, Preferred uint64
	Vltime, Pltime    uint32
}
- type ifreqAlias4 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet4
- DstAddr unix.RawSockaddrInet4
- MaskAddr unix.RawSockaddrInet4
- VHid uint32
- }
- type ifreqAlias6 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet6
- DstAddr unix.RawSockaddrInet6
- PrefixMask unix.RawSockaddrInet6
- Flags uint32
- Lifetime addrLifetime
- VHid uint32
- }
- type tun struct {
- Device string
- vpnNetworks []netip.Prefix
- MTU int
- Routes atomic.Pointer[[]Route]
- routeTree atomic.Pointer[bart.Table[routing.Gateways]]
- linkAddr *netroute.LinkAddr
- l *logrus.Logger
- devFd int
- }
- func (t *tun) Read(to []byte) (int, error) {
- // use readv() to read from the tunnel device, to eliminate the need for copying the buffer
- if t.devFd < 0 {
- return -1, syscall.EINVAL
- }
- // first 4 bytes is protocol family, in network byte order
- head := make([]byte, 4)
- iovecs := []syscall.Iovec{
- {&head[0], 4},
- {&to[0], uint64(len(to))},
- }
- n, _, errno := syscall.Syscall(syscall.SYS_READV, uintptr(t.devFd), uintptr(unsafe.Pointer(&iovecs[0])), uintptr(2))
- var err error
- if errno != 0 {
- err = syscall.Errno(errno)
- } else {
- err = nil
- }
- // fix bytes read number to exclude header
- bytesRead := int(n)
- if bytesRead < 0 {
- return bytesRead, err
- } else if bytesRead < 4 {
- return 0, err
- } else {
- return bytesRead - 4, err
- }
- }
- // Write is only valid for single threaded use
- func (t *tun) Write(from []byte) (int, error) {
- // use writev() to write to the tunnel device, to eliminate the need for copying the buffer
- if t.devFd < 0 {
- return -1, syscall.EINVAL
- }
- if len(from) <= 1 {
- return 0, syscall.EIO
- }
- ipVer := from[0] >> 4
- var head []byte
- // first 4 bytes is protocol family, in network byte order
- if ipVer == 4 {
- head = []byte{0, 0, 0, syscall.AF_INET}
- } else if ipVer == 6 {
- head = []byte{0, 0, 0, syscall.AF_INET6}
- } else {
- return 0, fmt.Errorf("unable to determine IP version from packet")
- }
- iovecs := []syscall.Iovec{
- {&head[0], 4},
- {&from[0], uint64(len(from))},
- }
- n, _, errno := syscall.Syscall(syscall.SYS_WRITEV, uintptr(t.devFd), uintptr(unsafe.Pointer(&iovecs[0])), uintptr(2))
- var err error
- if errno != 0 {
- err = syscall.Errno(errno)
- } else {
- err = nil
- }
- return int(n) - 4, err
- }
- func (t *tun) Close() error {
- if t.devFd >= 0 {
- err := syscall.Close(t.devFd)
- if err != nil {
- t.l.WithError(err).Error("Error closing device")
- }
- t.devFd = -1
- c := make(chan struct{})
- go func() {
- // destroying the interface can block if a read() is still pending. Do this asynchronously.
- defer close(c)
- s, err := syscall.Socket(syscall.AF_INET, syscall.SOCK_DGRAM, syscall.IPPROTO_IP)
- if err == nil {
- defer syscall.Close(s)
- ifreq := ifreqDestroy{Name: t.deviceBytes()}
- err = ioctl(uintptr(s), syscall.SIOCIFDESTROY, uintptr(unsafe.Pointer(&ifreq)))
- }
- if err != nil {
- t.l.WithError(err).Error("Error destroying tunnel")
- }
- }()
- // wait up to 1 second so we start blocking at the ioctl
- select {
- case <-c:
- case <-time.After(1 * time.Second):
- }
- }
- return nil
- }
- func newTunFromFd(_ *config.C, _ *logrus.Logger, _ int, _ []netip.Prefix) (*tun, error) {
- return nil, fmt.Errorf("newTunFromFd not supported in FreeBSD")
- }
- func newTun(c *config.C, l *logrus.Logger, vpnNetworks []netip.Prefix, _ bool) (*tun, error) {
- // Try to open existing tun device
- var fd int
- var err error
- deviceName := c.GetString("tun.dev", "")
- if deviceName != "" {
- fd, err = syscall.Open("/dev/"+deviceName, syscall.O_RDWR, 0)
- }
- if errors.Is(err, fs.ErrNotExist) || deviceName == "" {
- // If the device doesn't already exist, request a new one and rename it
- fd, err = syscall.Open("/dev/tun", syscall.O_RDWR, 0)
- }
- if err != nil {
- return nil, err
- }
- // Read the name of the interface
- var name [16]byte
- arg := fiodgnameArg{length: 16, buf: unsafe.Pointer(&name)}
- ctrlErr := ioctl(uintptr(fd), FIODGNAME, uintptr(unsafe.Pointer(&arg)))
- if ctrlErr == nil {
- // set broadcast mode and multicast
- ifmode := uint32(unix.IFF_BROADCAST | unix.IFF_MULTICAST)
- ctrlErr = ioctl(uintptr(fd), TUNSIFMODE, uintptr(unsafe.Pointer(&ifmode)))
- }
- if ctrlErr == nil {
- // turn on link-layer mode, to support ipv6
- ifhead := uint32(1)
- ctrlErr = ioctl(uintptr(fd), TUNSIFHEAD, uintptr(unsafe.Pointer(&ifhead)))
- }
- if ctrlErr != nil {
- return nil, err
- }
- ifName := string(bytes.TrimRight(name[:], "\x00"))
- if deviceName == "" {
- deviceName = ifName
- }
- // If the name doesn't match the desired interface name, rename it now
- if ifName != deviceName {
- s, err := unix.Socket(unix.AF_INET, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return nil, err
- }
- defer syscall.Close(s)
- fd := uintptr(s)
- var fromName [16]byte
- var toName [16]byte
- copy(fromName[:], ifName)
- copy(toName[:], deviceName)
- ifrr := ifreqRename{
- Name: fromName,
- Data: uintptr(unsafe.Pointer(&toName)),
- }
- // Set the device name
- ioctl(fd, syscall.SIOCSIFNAME, uintptr(unsafe.Pointer(&ifrr)))
- }
- t := &tun{
- Device: deviceName,
- vpnNetworks: vpnNetworks,
- MTU: c.GetInt("tun.mtu", DefaultMTU),
- l: l,
- devFd: fd,
- }
- err = t.reload(c, true)
- if err != nil {
- return nil, err
- }
- c.RegisterReloadCallback(func(c *config.C) {
- err := t.reload(c, false)
- if err != nil {
- util.LogWithContextIfNeeded("failed to reload tun device", err, t.l)
- }
- })
- return t, nil
- }
- func (t *tun) addIp(cidr netip.Prefix) error {
- if cidr.Addr().Is4() {
- ifr := ifreqAlias4{
- Name: t.deviceBytes(),
- Addr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: cidr.Addr().As4(),
- },
- DstAddr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: getBroadcast(cidr).As4(),
- },
- MaskAddr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: prefixToMask(cidr).As4(),
- },
- VHid: 0,
- }
- s, err := unix.Socket(unix.AF_INET, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- // Note: unix.SIOCAIFADDR corresponds to FreeBSD's OSIOCAIFADDR
- if err := ioctl(uintptr(s), unix.SIOCAIFADDR, uintptr(unsafe.Pointer(&ifr))); err != nil {
- return fmt.Errorf("failed to set tun address %s: %s", cidr.Addr().String(), err)
- }
- return nil
- }
- if cidr.Addr().Is6() {
- ifr := ifreqAlias6{
- Name: t.deviceBytes(),
- Addr: unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: cidr.Addr().As16(),
- },
- PrefixMask: unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: prefixToMask(cidr).As16(),
- },
- Lifetime: addrLifetime{
- Expire: 0,
- Preferred: 0,
- Vltime: 0xffffffff,
- Pltime: 0xffffffff,
- },
- Flags: IN6_IFF_NODAD,
- }
- s, err := syscall.Socket(syscall.AF_INET6, syscall.SOCK_DGRAM, syscall.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- if err := ioctl(uintptr(s), OSIOCAIFADDR_IN6, uintptr(unsafe.Pointer(&ifr))); err != nil {
- return fmt.Errorf("failed to set tun address %s: %s", cidr.Addr().String(), err)
- }
- return nil
- }
- return fmt.Errorf("unknown address type %v", cidr)
- }
- func (t *tun) Activate() error {
- // Setup our default MTU
- err := t.setMTU()
- if err != nil {
- return err
- }
- linkAddr, err := getLinkAddr(t.Device)
- if err != nil {
- return err
- }
- if linkAddr == nil {
- return fmt.Errorf("unable to discover link_addr for tun interface")
- }
- t.linkAddr = linkAddr
- for i := range t.vpnNetworks {
- err := t.addIp(t.vpnNetworks[i])
- if err != nil {
- return err
- }
- }
- return t.addRoutes(false)
- }
- func (t *tun) setMTU() error {
- // Set the MTU on the device
- s, err := unix.Socket(unix.AF_INET, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- ifm := ifreqMTU{Name: t.deviceBytes(), MTU: int32(t.MTU)}
- err = ioctl(uintptr(s), unix.SIOCSIFMTU, uintptr(unsafe.Pointer(&ifm)))
- return err
- }
- func (t *tun) reload(c *config.C, initial bool) error {
- change, routes, err := getAllRoutesFromConfig(c, t.vpnNetworks, initial)
- if err != nil {
- return err
- }
- if !initial && !change {
- return nil
- }
- routeTree, err := makeRouteTree(t.l, routes, false)
- if err != nil {
- return err
- }
- // Teach nebula how to handle the routes before establishing them in the system table
- oldRoutes := t.Routes.Swap(&routes)
- t.routeTree.Store(routeTree)
- if !initial {
- // Remove first, if the system removes a wanted route hopefully it will be re-added next
- err := t.removeRoutes(findRemovedRoutes(routes, *oldRoutes))
- if err != nil {
- util.LogWithContextIfNeeded("Failed to remove routes", err, t.l)
- }
- // Ensure any routes we actually want are installed
- err = t.addRoutes(true)
- if err != nil {
- // Catch any stray logs
- util.LogWithContextIfNeeded("Failed to add routes", err, t.l)
- }
- }
- return nil
- }
- func (t *tun) RoutesFor(ip netip.Addr) routing.Gateways {
- r, _ := t.routeTree.Load().Lookup(ip)
- return r
- }
- func (t *tun) Networks() []netip.Prefix {
- return t.vpnNetworks
- }
- func (t *tun) Name() string {
- return t.Device
- }
- func (t *tun) NewMultiQueueReader() (io.ReadWriteCloser, error) {
- return nil, fmt.Errorf("TODO: multiqueue not implemented for freebsd")
- }
- func (t *tun) addRoutes(logErrors bool) error {
- routes := *t.Routes.Load()
- for _, r := range routes {
- if len(r.Via) == 0 || !r.Install {
- // We don't allow route MTUs so only install routes with a via
- continue
- }
- err := addRoute(r.Cidr, t.linkAddr)
- if err != nil {
- retErr := util.NewContextualError("Failed to add route", map[string]any{"route": r}, err)
- if logErrors {
- retErr.Log(t.l)
- } else {
- return retErr
- }
- } else {
- t.l.WithField("route", r).Info("Added route")
- }
- }
- return nil
- }
- func (t *tun) removeRoutes(routes []Route) error {
- for _, r := range routes {
- if !r.Install {
- continue
- }
- err := delRoute(r.Cidr, t.linkAddr)
- if err != nil {
- t.l.WithError(err).WithField("route", r).Error("Failed to remove route")
- } else {
- t.l.WithField("route", r).Info("Removed route")
- }
- }
- return nil
- }
- func (t *tun) deviceBytes() (o [16]byte) {
- for i, c := range t.Device {
- o[i] = byte(c)
- }
- return
- }
// flipBytes inverts every bit of b in place and returns the same slice.
func flipBytes(b []byte) []byte {
	for i := range b {
		b[i] = ^b[i]
	}
	return b
}
// orBytes returns a new slice, as long as a, holding the byte-wise OR of a
// and b. b must be at least as long as a; neither input is modified.
func orBytes(a []byte, b []byte) []byte {
	merged := make([]byte, len(a))
	for i, v := range a {
		merged[i] = v | b[i]
	}
	return merged
}
- func getBroadcast(cidr netip.Prefix) netip.Addr {
- broadcast, _ := netip.AddrFromSlice(
- orBytes(
- cidr.Addr().AsSlice(),
- flipBytes(prefixToMask(cidr).AsSlice()),
- ),
- )
- return broadcast
- }
- func addRoute(prefix netip.Prefix, gateway netroute.Addr) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := &netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_ADD,
- Flags: unix.RTF_UP,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: gateway,
- }
- } else {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: gateway,
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- if errors.Is(err, unix.EEXIST) {
- // Try to do a change
- route.Type = unix.RTM_CHANGE
- data, err = route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage for change: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- fmt.Println("DOING CHANGE")
- return err
- }
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
- func delRoute(prefix netip.Prefix, gateway netroute.Addr) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_DELETE,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: gateway,
- }
- } else {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: gateway,
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
- // getLinkAddr Gets the link address for the interface of the given name
- func getLinkAddr(name string) (*netroute.LinkAddr, error) {
- rib, err := netroute.FetchRIB(unix.AF_UNSPEC, unix.NET_RT_IFLIST, 0)
- if err != nil {
- return nil, err
- }
- msgs, err := netroute.ParseRIB(unix.NET_RT_IFLIST, rib)
- if err != nil {
- return nil, err
- }
- for _, m := range msgs {
- switch m := m.(type) {
- case *netroute.InterfaceMessage:
- if m.Name == name {
- sa, ok := m.Addrs[unix.RTAX_IFP].(*netroute.LinkAddr)
- if ok {
- return sa, nil
- }
- }
- }
- }
- return nil, nil
- }
|