tun_linux.go 7.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320
  1. //go:build !android && !e2e_testing
  2. // +build !android,!e2e_testing
  3. package overlay
  4. import (
  5. "fmt"
  6. "io"
  7. "net"
  8. "os"
  9. "strings"
  10. "unsafe"
  11. "github.com/sirupsen/logrus"
  12. "github.com/vishvananda/netlink"
  13. "golang.org/x/sys/unix"
  14. )
  15. type tun struct {
  16. io.ReadWriteCloser
  17. fd int
  18. Device string
  19. Cidr *net.IPNet
  20. MaxMTU int
  21. DefaultMTU int
  22. TXQueueLen int
  23. Routes []Route
  24. UnsafeRoutes []Route
  25. l *logrus.Logger
  26. }
  27. type ifReq struct {
  28. Name [16]byte
  29. Flags uint16
  30. pad [8]byte
  31. }
  32. func ioctl(a1, a2, a3 uintptr) error {
  33. _, _, errno := unix.Syscall(unix.SYS_IOCTL, a1, a2, a3)
  34. if errno != 0 {
  35. return errno
  36. }
  37. return nil
  38. }
// ifreqAddr is the ioctl request layout carrying an interface name followed
// by an IPv4 socket address. Activate uses it for SIOCSIFADDR and
// SIOCSIFNETMASK.
type ifreqAddr struct {
	Name [16]byte
	Addr unix.RawSockaddrInet4
	pad  [8]byte
}
  44. type ifreqMTU struct {
  45. Name [16]byte
  46. MTU int32
  47. pad [8]byte
  48. }
  49. type ifreqQLEN struct {
  50. Name [16]byte
  51. Value int32
  52. pad [8]byte
  53. }
  54. func newTunFromFd(l *logrus.Logger, deviceFd int, cidr *net.IPNet, defaultMTU int, routes []Route, unsafeRoutes []Route, txQueueLen int) (*tun, error) {
  55. file := os.NewFile(uintptr(deviceFd), "/dev/net/tun")
  56. return &tun{
  57. ReadWriteCloser: file,
  58. fd: int(file.Fd()),
  59. Device: "tun0",
  60. Cidr: cidr,
  61. DefaultMTU: defaultMTU,
  62. TXQueueLen: txQueueLen,
  63. Routes: routes,
  64. UnsafeRoutes: unsafeRoutes,
  65. l: l,
  66. }, nil
  67. }
  68. func newTun(l *logrus.Logger, deviceName string, cidr *net.IPNet, defaultMTU int, routes []Route, unsafeRoutes []Route, txQueueLen int, multiqueue bool) (*tun, error) {
  69. fd, err := unix.Open("/dev/net/tun", os.O_RDWR, 0)
  70. if err != nil {
  71. return nil, err
  72. }
  73. var req ifReq
  74. req.Flags = uint16(unix.IFF_TUN | unix.IFF_NO_PI)
  75. if multiqueue {
  76. req.Flags |= unix.IFF_MULTI_QUEUE
  77. }
  78. copy(req.Name[:], deviceName)
  79. if err = ioctl(uintptr(fd), uintptr(unix.TUNSETIFF), uintptr(unsafe.Pointer(&req))); err != nil {
  80. return nil, err
  81. }
  82. name := strings.Trim(string(req.Name[:]), "\x00")
  83. file := os.NewFile(uintptr(fd), "/dev/net/tun")
  84. maxMTU := defaultMTU
  85. for _, r := range routes {
  86. if r.MTU > maxMTU {
  87. maxMTU = r.MTU
  88. }
  89. }
  90. return &tun{
  91. ReadWriteCloser: file,
  92. fd: int(file.Fd()),
  93. Device: name,
  94. Cidr: cidr,
  95. MaxMTU: maxMTU,
  96. DefaultMTU: defaultMTU,
  97. TXQueueLen: txQueueLen,
  98. Routes: routes,
  99. UnsafeRoutes: unsafeRoutes,
  100. l: l,
  101. }, nil
  102. }
  103. func (t *tun) NewMultiQueueReader() (io.ReadWriteCloser, error) {
  104. fd, err := unix.Open("/dev/net/tun", os.O_RDWR, 0)
  105. if err != nil {
  106. return nil, err
  107. }
  108. var req ifReq
  109. req.Flags = uint16(unix.IFF_TUN | unix.IFF_NO_PI | unix.IFF_MULTI_QUEUE)
  110. copy(req.Name[:], t.Device)
  111. if err = ioctl(uintptr(fd), uintptr(unix.TUNSETIFF), uintptr(unsafe.Pointer(&req))); err != nil {
  112. return nil, err
  113. }
  114. file := os.NewFile(uintptr(fd), "/dev/net/tun")
  115. return file, nil
  116. }
  117. func (t *tun) WriteRaw(b []byte) error {
  118. var nn int
  119. for {
  120. max := len(b)
  121. n, err := unix.Write(t.fd, b[nn:max])
  122. if n > 0 {
  123. nn += n
  124. }
  125. if nn == len(b) {
  126. return err
  127. }
  128. if err != nil {
  129. return err
  130. }
  131. if n == 0 {
  132. return io.ErrUnexpectedEOF
  133. }
  134. }
  135. }
  136. func (t *tun) Write(b []byte) (int, error) {
  137. return len(b), t.WriteRaw(b)
  138. }
  139. func (t tun) deviceBytes() (o [16]byte) {
  140. for i, c := range t.Device {
  141. o[i] = byte(c)
  142. }
  143. return
  144. }
  145. func (t tun) Activate() error {
  146. devName := t.deviceBytes()
  147. var addr, mask [4]byte
  148. copy(addr[:], t.Cidr.IP.To4())
  149. copy(mask[:], t.Cidr.Mask)
  150. s, err := unix.Socket(
  151. unix.AF_INET,
  152. unix.SOCK_DGRAM,
  153. unix.IPPROTO_IP,
  154. )
  155. if err != nil {
  156. return err
  157. }
  158. fd := uintptr(s)
  159. ifra := ifreqAddr{
  160. Name: devName,
  161. Addr: unix.RawSockaddrInet4{
  162. Family: unix.AF_INET,
  163. Addr: addr,
  164. },
  165. }
  166. // Set the device ip address
  167. if err = ioctl(fd, unix.SIOCSIFADDR, uintptr(unsafe.Pointer(&ifra))); err != nil {
  168. return fmt.Errorf("failed to set tun address: %s", err)
  169. }
  170. // Set the device network
  171. ifra.Addr.Addr = mask
  172. if err = ioctl(fd, unix.SIOCSIFNETMASK, uintptr(unsafe.Pointer(&ifra))); err != nil {
  173. return fmt.Errorf("failed to set tun netmask: %s", err)
  174. }
  175. // Set the device name
  176. ifrf := ifReq{Name: devName}
  177. if err = ioctl(fd, unix.SIOCGIFFLAGS, uintptr(unsafe.Pointer(&ifrf))); err != nil {
  178. return fmt.Errorf("failed to set tun device name: %s", err)
  179. }
  180. // Set the MTU on the device
  181. ifm := ifreqMTU{Name: devName, MTU: int32(t.MaxMTU)}
  182. if err = ioctl(fd, unix.SIOCSIFMTU, uintptr(unsafe.Pointer(&ifm))); err != nil {
  183. // This is currently a non fatal condition because the route table must have the MTU set appropriately as well
  184. t.l.WithError(err).Error("Failed to set tun mtu")
  185. }
  186. // Set the transmit queue length
  187. ifrq := ifreqQLEN{Name: devName, Value: int32(t.TXQueueLen)}
  188. if err = ioctl(fd, unix.SIOCSIFTXQLEN, uintptr(unsafe.Pointer(&ifrq))); err != nil {
  189. // If we can't set the queue length nebula will still work but it may lead to packet loss
  190. t.l.WithError(err).Error("Failed to set tun tx queue length")
  191. }
  192. // Bring up the interface
  193. ifrf.Flags = ifrf.Flags | unix.IFF_UP
  194. if err = ioctl(fd, unix.SIOCSIFFLAGS, uintptr(unsafe.Pointer(&ifrf))); err != nil {
  195. return fmt.Errorf("failed to bring the tun device up: %s", err)
  196. }
  197. // Set the routes
  198. link, err := netlink.LinkByName(t.Device)
  199. if err != nil {
  200. return fmt.Errorf("failed to get tun device link: %s", err)
  201. }
  202. // Default route
  203. dr := &net.IPNet{IP: t.Cidr.IP.Mask(t.Cidr.Mask), Mask: t.Cidr.Mask}
  204. nr := netlink.Route{
  205. LinkIndex: link.Attrs().Index,
  206. Dst: dr,
  207. MTU: t.DefaultMTU,
  208. AdvMSS: t.advMSS(Route{}),
  209. Scope: unix.RT_SCOPE_LINK,
  210. Src: t.Cidr.IP,
  211. Protocol: unix.RTPROT_KERNEL,
  212. Table: unix.RT_TABLE_MAIN,
  213. Type: unix.RTN_UNICAST,
  214. }
  215. err = netlink.RouteReplace(&nr)
  216. if err != nil {
  217. return fmt.Errorf("failed to set mtu %v on the default route %v; %v", t.DefaultMTU, dr, err)
  218. }
  219. // Path routes
  220. for _, r := range t.Routes {
  221. nr := netlink.Route{
  222. LinkIndex: link.Attrs().Index,
  223. Dst: r.Cidr,
  224. MTU: r.MTU,
  225. AdvMSS: t.advMSS(r),
  226. Scope: unix.RT_SCOPE_LINK,
  227. }
  228. err = netlink.RouteAdd(&nr)
  229. if err != nil {
  230. return fmt.Errorf("failed to set mtu %v on route %v; %v", r.MTU, r.Cidr, err)
  231. }
  232. }
  233. // Unsafe path routes
  234. for _, r := range t.UnsafeRoutes {
  235. nr := netlink.Route{
  236. LinkIndex: link.Attrs().Index,
  237. Dst: r.Cidr,
  238. MTU: r.MTU,
  239. Priority: r.Metric,
  240. AdvMSS: t.advMSS(r),
  241. Scope: unix.RT_SCOPE_LINK,
  242. }
  243. err = netlink.RouteAdd(&nr)
  244. if err != nil {
  245. return fmt.Errorf("failed to set mtu %v on route %v; %v", r.MTU, r.Cidr, err)
  246. }
  247. }
  248. // Run the interface
  249. ifrf.Flags = ifrf.Flags | unix.IFF_UP | unix.IFF_RUNNING
  250. if err = ioctl(fd, unix.SIOCSIFFLAGS, uintptr(unsafe.Pointer(&ifrf))); err != nil {
  251. return fmt.Errorf("failed to run tun device: %s", err)
  252. }
  253. return nil
  254. }
// CidrNet returns the network stored in the Cidr field. The pointer is
// returned as is, not copied.
func (t *tun) CidrNet() *net.IPNet {
	return t.Cidr
}
// DeviceName returns the interface name stored in the Device field.
func (t *tun) DeviceName() string {
	return t.Device
}
  261. func (t tun) advMSS(r Route) int {
  262. mtu := r.MTU
  263. if r.MTU == 0 {
  264. mtu = t.DefaultMTU
  265. }
  266. // We only need to set advmss if the route MTU does not match the device MTU
  267. if mtu != t.MaxMTU {
  268. return mtu - 40
  269. }
  270. return 0
  271. }