123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565 |
- //go:build !ios && !e2e_testing
- // +build !ios,!e2e_testing
- package overlay
- import (
- "errors"
- "fmt"
- "io"
- "net"
- "net/netip"
- "os"
- "sync/atomic"
- "syscall"
- "unsafe"
- "github.com/gaissmai/bart"
- "github.com/sirupsen/logrus"
- "github.com/slackhq/nebula/config"
- "github.com/slackhq/nebula/util"
- netroute "golang.org/x/net/route"
- "golang.org/x/sys/unix"
- )
- type tun struct {
- io.ReadWriteCloser
- Device string
- vpnNetworks []netip.Prefix
- DefaultMTU int
- Routes atomic.Pointer[[]Route]
- routeTree atomic.Pointer[bart.Table[netip.Addr]]
- linkAddr *netroute.LinkAddr
- l *logrus.Logger
- // cache out buffer since we need to prepend 4 bytes for tun metadata
- out []byte
- }
- type ifReq struct {
- Name [unix.IFNAMSIZ]byte
- Flags uint16
- pad [8]byte
- }
const (
	// _SIOCAIFADDR_IN6 is the ioctl request activate6 issues to add an IPv6
	// address to the interface (decimal 2155899162).
	_SIOCAIFADDR_IN6 = 0x8080691a

	// _UTUN_OPT_IFNAME is the socket option newTun reads to learn the
	// interface name of the connected control socket.
	_UTUN_OPT_IFNAME = 2

	// _IN6_IFF_NODAD is set in the Flags of the IPv6 alias request.
	_IN6_IFF_NODAD = 0x0020

	// _IN6_IFF_SECURED is declared for completeness; nothing visible here uses it.
	_IN6_IFF_SECURED = 0x0400

	// utunControlName is the control name copied into CtlInfo before the
	// CTLIOCGINFO lookup in newTun.
	utunControlName = "com.apple.net.utun_control"
)
// ifreqMTU is the request structure handed to the SIOCSIFMTU ioctl in
// Activate. It is passed to the kernel by pointer, so the order and size of
// its fields must not change.
type ifreqMTU struct {
	// Name is the interface name, filled from deviceBytes.
	Name [16]byte
	// MTU is the value to apply to the interface.
	MTU int32
	// pad is never written by this file.
	// NOTE(review): presumably pads the struct to the size the kernel expects — confirm.
	pad [8]byte
}
// addrLifetime is the Lifetime member of ifreqAlias6. activate6 only sets
// Vltime and Pltime (both to 0xffffffff, "never expires"); Expire and
// Preferred are left at zero.
type addrLifetime struct {
	// NOTE(review): Expire and Preferred look like 8-byte placeholders for
	// kernel timestamp fields rather than genuine floats — confirm against the
	// Darwin headers before touching their types.
	Expire    float64
	Preferred float64

	Vltime uint32
	Pltime uint32
}
- type ifreqAlias4 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet4
- DstAddr unix.RawSockaddrInet4
- MaskAddr unix.RawSockaddrInet4
- }
- type ifreqAlias6 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet6
- DstAddr unix.RawSockaddrInet6
- PrefixMask unix.RawSockaddrInet6
- Flags uint32
- Lifetime addrLifetime
- }
- func newTun(c *config.C, l *logrus.Logger, vpnNetworks []netip.Prefix, _ bool) (*tun, error) {
- name := c.GetString("tun.dev", "")
- ifIndex := -1
- if name != "" && name != "utun" {
- _, err := fmt.Sscanf(name, "utun%d", &ifIndex)
- if err != nil || ifIndex < 0 {
- // NOTE: we don't make this error so we don't break existing
- // configs that set a name before it was used.
- l.Warn("interface name must be utun[0-9]+ on Darwin, ignoring")
- ifIndex = -1
- }
- }
- fd, err := unix.Socket(unix.AF_SYSTEM, unix.SOCK_DGRAM, unix.AF_SYS_CONTROL)
- if err != nil {
- return nil, fmt.Errorf("system socket: %v", err)
- }
- var ctlInfo = &unix.CtlInfo{}
- copy(ctlInfo.Name[:], utunControlName)
- err = unix.IoctlCtlInfo(fd, ctlInfo)
- if err != nil {
- return nil, fmt.Errorf("CTLIOCGINFO: %v", err)
- }
- err = unix.Connect(fd, &unix.SockaddrCtl{
- ID: ctlInfo.Id,
- Unit: uint32(ifIndex) + 1,
- })
- if err != nil {
- return nil, fmt.Errorf("SYS_CONNECT: %v", err)
- }
- name, err = unix.GetsockoptString(fd, unix.AF_SYS_CONTROL, _UTUN_OPT_IFNAME)
- if err != nil {
- return nil, fmt.Errorf("failed to retrieve tun name: %w", err)
- }
- err = unix.SetNonblock(fd, true)
- if err != nil {
- return nil, fmt.Errorf("SetNonblock: %v", err)
- }
- t := &tun{
- ReadWriteCloser: os.NewFile(uintptr(fd), ""),
- Device: name,
- vpnNetworks: vpnNetworks,
- DefaultMTU: c.GetInt("tun.mtu", DefaultMTU),
- l: l,
- }
- err = t.reload(c, true)
- if err != nil {
- return nil, err
- }
- c.RegisterReloadCallback(func(c *config.C) {
- err := t.reload(c, false)
- if err != nil {
- util.LogWithContextIfNeeded("failed to reload tun device", err, t.l)
- }
- })
- return t, nil
- }
- func (t *tun) deviceBytes() (o [16]byte) {
- for i, c := range t.Device {
- o[i] = byte(c)
- }
- return
- }
- func newTunFromFd(_ *config.C, _ *logrus.Logger, _ int, _ []netip.Prefix) (*tun, error) {
- return nil, fmt.Errorf("newTunFromFd not supported in Darwin")
- }
- func (t *tun) Close() error {
- if t.ReadWriteCloser != nil {
- return t.ReadWriteCloser.Close()
- }
- return nil
- }
- func (t *tun) Activate() error {
- devName := t.deviceBytes()
- s, err := unix.Socket(
- unix.AF_INET,
- unix.SOCK_DGRAM,
- unix.IPPROTO_IP,
- )
- if err != nil {
- return err
- }
- defer unix.Close(s)
- fd := uintptr(s)
- // Set the MTU on the device
- ifm := ifreqMTU{Name: devName, MTU: int32(t.DefaultMTU)}
- if err = ioctl(fd, unix.SIOCSIFMTU, uintptr(unsafe.Pointer(&ifm))); err != nil {
- return fmt.Errorf("failed to set tun mtu: %v", err)
- }
- // Get the device flags
- ifrf := ifReq{Name: devName}
- if err = ioctl(fd, unix.SIOCGIFFLAGS, uintptr(unsafe.Pointer(&ifrf))); err != nil {
- return fmt.Errorf("failed to get tun flags: %s", err)
- }
- linkAddr, err := getLinkAddr(t.Device)
- if err != nil {
- return err
- }
- if linkAddr == nil {
- return fmt.Errorf("unable to discover link_addr for tun interface")
- }
- t.linkAddr = linkAddr
- for _, network := range t.vpnNetworks {
- if network.Addr().Is4() {
- err = t.activate4(network)
- if err != nil {
- return err
- }
- } else {
- err = t.activate6(network)
- if err != nil {
- return err
- }
- }
- }
- // Run the interface
- ifrf.Flags = ifrf.Flags | unix.IFF_UP | unix.IFF_RUNNING
- if err = ioctl(fd, unix.SIOCSIFFLAGS, uintptr(unsafe.Pointer(&ifrf))); err != nil {
- return fmt.Errorf("failed to run tun device: %s", err)
- }
- // Unsafe path routes
- return t.addRoutes(false)
- }
- func (t *tun) activate4(network netip.Prefix) error {
- s, err := unix.Socket(
- unix.AF_INET,
- unix.SOCK_DGRAM,
- unix.IPPROTO_IP,
- )
- if err != nil {
- return err
- }
- defer unix.Close(s)
- ifr := ifreqAlias4{
- Name: t.deviceBytes(),
- Addr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: network.Addr().As4(),
- },
- DstAddr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: network.Addr().As4(),
- },
- MaskAddr: unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: prefixToMask(network).As4(),
- },
- }
- if err := ioctl(uintptr(s), unix.SIOCAIFADDR, uintptr(unsafe.Pointer(&ifr))); err != nil {
- return fmt.Errorf("failed to set tun v4 address: %s", err)
- }
- err = addRoute(network, t.linkAddr)
- if err != nil {
- return err
- }
- return nil
- }
- func (t *tun) activate6(network netip.Prefix) error {
- s, err := unix.Socket(
- unix.AF_INET6,
- unix.SOCK_DGRAM,
- unix.IPPROTO_IP,
- )
- if err != nil {
- return err
- }
- defer unix.Close(s)
- ifr := ifreqAlias6{
- Name: t.deviceBytes(),
- Addr: unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: network.Addr().As16(),
- },
- PrefixMask: unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: prefixToMask(network).As16(),
- },
- Lifetime: addrLifetime{
- // never expires
- Vltime: 0xffffffff,
- Pltime: 0xffffffff,
- },
- //TODO: CERT-V2 should we disable DAD (duplicate address detection) and mark this as a secured address?
- Flags: _IN6_IFF_NODAD,
- }
- if err := ioctl(uintptr(s), _SIOCAIFADDR_IN6, uintptr(unsafe.Pointer(&ifr))); err != nil {
- return fmt.Errorf("failed to set tun address: %s", err)
- }
- return nil
- }
- func (t *tun) reload(c *config.C, initial bool) error {
- change, routes, err := getAllRoutesFromConfig(c, t.vpnNetworks, initial)
- if err != nil {
- return err
- }
- if !initial && !change {
- return nil
- }
- routeTree, err := makeRouteTree(t.l, routes, false)
- if err != nil {
- return err
- }
- // Teach nebula how to handle the routes before establishing them in the system table
- oldRoutes := t.Routes.Swap(&routes)
- t.routeTree.Store(routeTree)
- if !initial {
- // Remove first, if the system removes a wanted route hopefully it will be re-added next
- err := t.removeRoutes(findRemovedRoutes(routes, *oldRoutes))
- if err != nil {
- util.LogWithContextIfNeeded("Failed to remove routes", err, t.l)
- }
- // Ensure any routes we actually want are installed
- err = t.addRoutes(true)
- if err != nil {
- // Catch any stray logs
- util.LogWithContextIfNeeded("Failed to add routes", err, t.l)
- }
- }
- return nil
- }
- func (t *tun) RouteFor(ip netip.Addr) netip.Addr {
- r, ok := t.routeTree.Load().Lookup(ip)
- if ok {
- return r
- }
- return netip.Addr{}
- }
- // Get the LinkAddr for the interface of the given name
- // Is there an easier way to fetch this when we create the interface?
- // Maybe SIOCGIFINDEX? but this doesn't appear to exist in the darwin headers.
- func getLinkAddr(name string) (*netroute.LinkAddr, error) {
- rib, err := netroute.FetchRIB(unix.AF_UNSPEC, unix.NET_RT_IFLIST, 0)
- if err != nil {
- return nil, err
- }
- msgs, err := netroute.ParseRIB(unix.NET_RT_IFLIST, rib)
- if err != nil {
- return nil, err
- }
- for _, m := range msgs {
- switch m := m.(type) {
- case *netroute.InterfaceMessage:
- if m.Name == name {
- sa, ok := m.Addrs[unix.RTAX_IFP].(*netroute.LinkAddr)
- if ok {
- return sa, nil
- }
- }
- }
- }
- return nil, nil
- }
- func (t *tun) addRoutes(logErrors bool) error {
- routes := *t.Routes.Load()
- for _, r := range routes {
- if !r.Via.IsValid() || !r.Install {
- // We don't allow route MTUs so only install routes with a via
- continue
- }
- err := addRoute(r.Cidr, t.linkAddr)
- if err != nil {
- if errors.Is(err, unix.EEXIST) {
- t.l.WithField("route", r.Cidr).
- Warnf("unable to add unsafe_route, identical route already exists")
- } else {
- retErr := util.NewContextualError("Failed to add route", map[string]interface{}{"route": r}, err)
- if logErrors {
- retErr.Log(t.l)
- } else {
- return retErr
- }
- }
- } else {
- t.l.WithField("route", r).Info("Added route")
- }
- }
- return nil
- }
- func (t *tun) removeRoutes(routes []Route) error {
- for _, r := range routes {
- if !r.Install {
- continue
- }
- err := delRoute(r.Cidr, t.linkAddr)
- if err != nil {
- t.l.WithError(err).WithField("route", r).Error("Failed to remove route")
- } else {
- t.l.WithField("route", r).Info("Removed route")
- }
- }
- return nil
- }
- func addRoute(prefix netip.Prefix, gateway netroute.Addr) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := &netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_ADD,
- Flags: unix.RTF_UP,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: gateway,
- }
- } else {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: gateway,
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
- func delRoute(prefix netip.Prefix, gateway netroute.Addr) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_DELETE,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: gateway,
- }
- } else {
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: gateway,
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
- func (t *tun) Read(to []byte) (int, error) {
- buf := make([]byte, len(to)+4)
- n, err := t.ReadWriteCloser.Read(buf)
- copy(to, buf[4:])
- return n - 4, err
- }
- // Write is only valid for single threaded use
- func (t *tun) Write(from []byte) (int, error) {
- buf := t.out
- if cap(buf) < len(from)+4 {
- buf = make([]byte, len(from)+4)
- t.out = buf
- }
- buf = buf[:len(from)+4]
- if len(from) == 0 {
- return 0, syscall.EIO
- }
- // Determine the IP Family for the NULL L2 Header
- ipVer := from[0] >> 4
- if ipVer == 4 {
- buf[3] = syscall.AF_INET
- } else if ipVer == 6 {
- buf[3] = syscall.AF_INET6
- } else {
- return 0, fmt.Errorf("unable to determine IP version from packet")
- }
- copy(buf[4:], from)
- n, err := t.ReadWriteCloser.Write(buf)
- return n - 4, err
- }
- func (t *tun) Networks() []netip.Prefix {
- return t.vpnNetworks
- }
- func (t *tun) Name() string {
- return t.Device
- }
- func (t *tun) NewMultiQueueReader() (io.ReadWriteCloser, error) {
- return nil, fmt.Errorf("TODO: multiqueue not implemented for darwin")
- }
// prefixToMask converts the prefix length of prefix into a netmask expressed
// as an address: 32 bits wide when the prefix address is IPv4, 128 bits wide
// otherwise. An invalid prefix produces the zero netip.Addr.
func prefixToMask(prefix netip.Prefix) netip.Addr {
	width := 8 * net.IPv6len
	if prefix.Addr().Is4() {
		width = 8 * net.IPv4len
	}

	// CIDRMask returns nil for an out-of-range length, which AddrFromSlice
	// reports as not ok.
	mask, ok := netip.AddrFromSlice(net.CIDRMask(prefix.Bits(), width))
	if !ok {
		return netip.Addr{}
	}
	return mask
}
|