123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549 |
- //go:build !e2e_testing
- // +build !e2e_testing
- package overlay
- import (
- "errors"
- "fmt"
- "io"
- "net/netip"
- "os"
- "regexp"
- "sync/atomic"
- "syscall"
- "unsafe"
- "github.com/gaissmai/bart"
- "github.com/sirupsen/logrus"
- "github.com/slackhq/nebula/config"
- "github.com/slackhq/nebula/routing"
- "github.com/slackhq/nebula/util"
- netroute "golang.org/x/net/route"
- "golang.org/x/sys/unix"
- )
// ioctl request numbers used by this file.
// NOTE(review): presumably these mirror the NetBSD kernel headers; confirm
// against the target release before changing them.
const (
	// SIOCAIFADDR_IN6 is the request addIp issues to add an IPv6 address to
	// the interface.
	SIOCAIFADDR_IN6 = 0x8080696b

	// TUNSIFHEAD is the request Activate issues with a value of 1. Read and
	// Write treat the first 4 bytes of every packet as an address family
	// header.
	TUNSIFHEAD = 0x80047442

	// TUNSIFMODE is the request Activate issues with IFF_BROADCAST to set the
	// mode of the tun device.
	TUNSIFMODE = 0x80047458
)
- type ifreqAlias4 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet4
- DstAddr unix.RawSockaddrInet4
- MaskAddr unix.RawSockaddrInet4
- }
- type ifreqAlias6 struct {
- Name [unix.IFNAMSIZ]byte
- Addr unix.RawSockaddrInet6
- DstAddr unix.RawSockaddrInet6
- PrefixMask unix.RawSockaddrInet6
- Flags uint32
- Lifetime addrLifetime
- }
- type ifreq struct {
- Name [unix.IFNAMSIZ]byte
- data int
- }
// addrLifetime is the lifetime section embedded in ifreqAlias6.
//
// addIp only sets Vltime and Pltime (both to 0xffffffff); Expire and
// Preferred are left at zero. The struct is handed to the kernel as part of
// ifreqAlias6, so the field order and types must not be changed.
type addrLifetime struct {
	Expire    uint64
	Preferred uint64
	Vltime    uint32
	Pltime    uint32
}
- type tun struct {
- Device string
- vpnNetworks []netip.Prefix
- MTU int
- Routes atomic.Pointer[[]Route]
- routeTree atomic.Pointer[bart.Table[routing.Gateways]]
- l *logrus.Logger
- f *os.File
- fd int
- }
// deviceNameRE matches the only device names newTun accepts: the literal
// "tun" followed by one or more decimal digits, with nothing before or after.
var deviceNameRE = regexp.MustCompile(`^tun[0-9]+$`)
- func newTunFromFd(_ *config.C, _ *logrus.Logger, _ int, _ []netip.Prefix) (*tun, error) {
- return nil, fmt.Errorf("newTunFromFd not supported in NetBSD")
- }
- func newTun(c *config.C, l *logrus.Logger, vpnNetworks []netip.Prefix, _ bool) (*tun, error) {
- // Try to open tun device
- var err error
- deviceName := c.GetString("tun.dev", "")
- if deviceName == "" {
- return nil, fmt.Errorf("a device name in the format of /dev/tunN must be specified")
- }
- if !deviceNameRE.MatchString(deviceName) {
- return nil, fmt.Errorf("a device name in the format of /dev/tunN must be specified")
- }
- fd, err := unix.Open("/dev/"+deviceName, os.O_RDWR, 0)
- if err != nil {
- return nil, err
- }
- err = unix.SetNonblock(fd, true)
- if err != nil {
- l.WithError(err).Warn("Failed to set the tun device as nonblocking")
- }
- t := &tun{
- f: os.NewFile(uintptr(fd), ""),
- fd: fd,
- Device: deviceName,
- vpnNetworks: vpnNetworks,
- MTU: c.GetInt("tun.mtu", DefaultMTU),
- l: l,
- }
- err = t.reload(c, true)
- if err != nil {
- return nil, err
- }
- c.RegisterReloadCallback(func(c *config.C) {
- err := t.reload(c, false)
- if err != nil {
- util.LogWithContextIfNeeded("failed to reload tun device", err, t.l)
- }
- })
- return t, nil
- }
- func (t *tun) Close() error {
- if t.f != nil {
- if err := t.f.Close(); err != nil {
- return fmt.Errorf("error closing tun file: %w", err)
- }
- // t.f.Close should have handled it for us but let's be extra sure
- _ = unix.Close(t.fd)
- s, err := syscall.Socket(syscall.AF_INET, syscall.SOCK_DGRAM, syscall.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- ifr := ifreq{Name: t.deviceBytes()}
- err = ioctl(uintptr(s), syscall.SIOCIFDESTROY, uintptr(unsafe.Pointer(&ifr)))
- return err
- }
- return nil
- }
- func (t *tun) Read(to []byte) (int, error) {
- rc, err := t.f.SyscallConn()
- if err != nil {
- return 0, fmt.Errorf("failed to get syscall conn for tun: %w", err)
- }
- var errno syscall.Errno
- var n uintptr
- err = rc.Read(func(fd uintptr) bool {
- // first 4 bytes is protocol family, in network byte order
- head := [4]byte{}
- iovecs := []syscall.Iovec{
- {&head[0], 4},
- {&to[0], uint64(len(to))},
- }
- n, _, errno = syscall.Syscall(syscall.SYS_READV, fd, uintptr(unsafe.Pointer(&iovecs[0])), uintptr(2))
- if errno.Temporary() {
- // We got an EAGAIN, EINTR, or EWOULDBLOCK, go again
- return false
- }
- return true
- })
- if err != nil {
- if err == syscall.EBADF || err.Error() == "use of closed file" {
- // Go doesn't export poll.ErrFileClosing but happily reports it to us so here we are
- // https://github.com/golang/go/blob/master/src/internal/poll/fd_poll_runtime.go#L121
- return 0, os.ErrClosed
- }
- return 0, fmt.Errorf("failed to make read call for tun: %w", err)
- }
- if errno != 0 {
- return 0, fmt.Errorf("failed to make inner read call for tun: %w", errno)
- }
- // fix bytes read number to exclude header
- bytesRead := int(n)
- if bytesRead < 0 {
- return bytesRead, nil
- } else if bytesRead < 4 {
- return 0, nil
- } else {
- return bytesRead - 4, nil
- }
- }
- // Write is only valid for single threaded use
- func (t *tun) Write(from []byte) (int, error) {
- if len(from) <= 1 {
- return 0, syscall.EIO
- }
- ipVer := from[0] >> 4
- var head [4]byte
- // first 4 bytes is protocol family, in network byte order
- if ipVer == 4 {
- head[3] = syscall.AF_INET
- } else if ipVer == 6 {
- head[3] = syscall.AF_INET6
- } else {
- return 0, fmt.Errorf("unable to determine IP version from packet")
- }
- rc, err := t.f.SyscallConn()
- if err != nil {
- return 0, err
- }
- var errno syscall.Errno
- var n uintptr
- err = rc.Write(func(fd uintptr) bool {
- iovecs := []syscall.Iovec{
- {&head[0], 4},
- {&from[0], uint64(len(from))},
- }
- n, _, errno = syscall.Syscall(syscall.SYS_WRITEV, fd, uintptr(unsafe.Pointer(&iovecs[0])), uintptr(2))
- // According to NetBSD documentation for TUN, writes will only return errors in which
- // this packet will never be delivered so just go on living life.
- return true
- })
- if err != nil {
- return 0, err
- }
- if errno != 0 {
- return 0, errno
- }
- return int(n) - 4, err
- }
- func (t *tun) addIp(cidr netip.Prefix) error {
- if cidr.Addr().Is4() {
- var req ifreqAlias4
- req.Name = t.deviceBytes()
- req.Addr = unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: cidr.Addr().As4(),
- }
- req.DstAddr = unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: cidr.Addr().As4(),
- }
- req.MaskAddr = unix.RawSockaddrInet4{
- Len: unix.SizeofSockaddrInet4,
- Family: unix.AF_INET,
- Addr: prefixToMask(cidr).As4(),
- }
- s, err := unix.Socket(unix.AF_INET, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- if err := ioctl(uintptr(s), unix.SIOCAIFADDR, uintptr(unsafe.Pointer(&req))); err != nil {
- return fmt.Errorf("failed to set tun address %s: %s", cidr.Addr(), err)
- }
- return nil
- }
- if cidr.Addr().Is6() {
- var req ifreqAlias6
- req.Name = t.deviceBytes()
- req.Addr = unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: cidr.Addr().As16(),
- }
- req.PrefixMask = unix.RawSockaddrInet6{
- Len: unix.SizeofSockaddrInet6,
- Family: unix.AF_INET6,
- Addr: prefixToMask(cidr).As16(),
- }
- req.Lifetime = addrLifetime{
- Vltime: 0xffffffff,
- Pltime: 0xffffffff,
- }
- s, err := unix.Socket(unix.AF_INET6, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- if err := ioctl(uintptr(s), SIOCAIFADDR_IN6, uintptr(unsafe.Pointer(&req))); err != nil {
- return fmt.Errorf("failed to set tun address %s: %s", cidr.Addr().String(), err)
- }
- return nil
- }
- return fmt.Errorf("unknown address type %v", cidr)
- }
- func (t *tun) Activate() error {
- mode := int32(unix.IFF_BROADCAST)
- err := ioctl(uintptr(t.fd), TUNSIFMODE, uintptr(unsafe.Pointer(&mode)))
- if err != nil {
- return fmt.Errorf("failed to set tun device mode: %w", err)
- }
- v := 1
- err = ioctl(uintptr(t.fd), TUNSIFHEAD, uintptr(unsafe.Pointer(&v)))
- if err != nil {
- return fmt.Errorf("failed to set tun device head: %w", err)
- }
- err = t.doIoctlByName(unix.SIOCSIFMTU, uint32(t.MTU))
- if err != nil {
- return fmt.Errorf("failed to set tun mtu: %w", err)
- }
- for i := range t.vpnNetworks {
- err = t.addIp(t.vpnNetworks[i])
- if err != nil {
- return err
- }
- }
- return t.addRoutes(false)
- }
- func (t *tun) doIoctlByName(ctl uintptr, value uint32) error {
- s, err := unix.Socket(unix.AF_INET, unix.SOCK_DGRAM, unix.IPPROTO_IP)
- if err != nil {
- return err
- }
- defer syscall.Close(s)
- ir := ifreq{Name: t.deviceBytes(), data: int(value)}
- err = ioctl(uintptr(s), ctl, uintptr(unsafe.Pointer(&ir)))
- return err
- }
- func (t *tun) reload(c *config.C, initial bool) error {
- change, routes, err := getAllRoutesFromConfig(c, t.vpnNetworks, initial)
- if err != nil {
- return err
- }
- if !initial && !change {
- return nil
- }
- routeTree, err := makeRouteTree(t.l, routes, false)
- if err != nil {
- return err
- }
- // Teach nebula how to handle the routes before establishing them in the system table
- oldRoutes := t.Routes.Swap(&routes)
- t.routeTree.Store(routeTree)
- if !initial {
- // Remove first, if the system removes a wanted route hopefully it will be re-added next
- err := t.removeRoutes(findRemovedRoutes(routes, *oldRoutes))
- if err != nil {
- util.LogWithContextIfNeeded("Failed to remove routes", err, t.l)
- }
- // Ensure any routes we actually want are installed
- err = t.addRoutes(true)
- if err != nil {
- // Catch any stray logs
- util.LogWithContextIfNeeded("Failed to add routes", err, t.l)
- }
- }
- return nil
- }
- func (t *tun) RoutesFor(ip netip.Addr) routing.Gateways {
- r, _ := t.routeTree.Load().Lookup(ip)
- return r
- }
- func (t *tun) Networks() []netip.Prefix {
- return t.vpnNetworks
- }
- func (t *tun) Name() string {
- return t.Device
- }
- func (t *tun) NewMultiQueueReader() (io.ReadWriteCloser, error) {
- return nil, fmt.Errorf("TODO: multiqueue not implemented for netbsd")
- }
- func (t *tun) addRoutes(logErrors bool) error {
- routes := *t.Routes.Load()
- for _, r := range routes {
- if len(r.Via) == 0 || !r.Install {
- // We don't allow route MTUs so only install routes with a via
- continue
- }
- err := addRoute(r.Cidr, t.vpnNetworks)
- if err != nil {
- retErr := util.NewContextualError("Failed to add route", map[string]any{"route": r}, err)
- if logErrors {
- retErr.Log(t.l)
- } else {
- return retErr
- }
- } else {
- t.l.WithField("route", r).Info("Added route")
- }
- }
- return nil
- }
- func (t *tun) removeRoutes(routes []Route) error {
- for _, r := range routes {
- if !r.Install {
- continue
- }
- err := delRoute(r.Cidr, t.vpnNetworks)
- if err != nil {
- t.l.WithError(err).WithField("route", r).Error("Failed to remove route")
- } else {
- t.l.WithField("route", r).Info("Removed route")
- }
- }
- return nil
- }
- func (t *tun) deviceBytes() (o [16]byte) {
- for i, c := range t.Device {
- o[i] = byte(c)
- }
- return
- }
- func addRoute(prefix netip.Prefix, gateways []netip.Prefix) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := &netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_ADD,
- Flags: unix.RTF_UP | unix.RTF_GATEWAY,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- gw, err := selectGateway(prefix, gateways)
- if err != nil {
- return err
- }
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: &netroute.Inet4Addr{IP: gw.Addr().As4()},
- }
- } else {
- gw, err := selectGateway(prefix, gateways)
- if err != nil {
- return err
- }
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: &netroute.Inet6Addr{IP: gw.Addr().As16()},
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- if errors.Is(err, unix.EEXIST) {
- // Try to do a change
- route.Type = unix.RTM_CHANGE
- data, err = route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage for change: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- return err
- }
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
- func delRoute(prefix netip.Prefix, gateways []netip.Prefix) error {
- sock, err := unix.Socket(unix.AF_ROUTE, unix.SOCK_RAW, unix.AF_UNSPEC)
- if err != nil {
- return fmt.Errorf("unable to create AF_ROUTE socket: %v", err)
- }
- defer unix.Close(sock)
- route := netroute.RouteMessage{
- Version: unix.RTM_VERSION,
- Type: unix.RTM_DELETE,
- Seq: 1,
- }
- if prefix.Addr().Is4() {
- gw, err := selectGateway(prefix, gateways)
- if err != nil {
- return err
- }
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet4Addr{IP: prefix.Masked().Addr().As4()},
- unix.RTAX_NETMASK: &netroute.Inet4Addr{IP: prefixToMask(prefix).As4()},
- unix.RTAX_GATEWAY: &netroute.Inet4Addr{IP: gw.Addr().As4()},
- }
- } else {
- gw, err := selectGateway(prefix, gateways)
- if err != nil {
- return err
- }
- route.Addrs = []netroute.Addr{
- unix.RTAX_DST: &netroute.Inet6Addr{IP: prefix.Masked().Addr().As16()},
- unix.RTAX_NETMASK: &netroute.Inet6Addr{IP: prefixToMask(prefix).As16()},
- unix.RTAX_GATEWAY: &netroute.Inet6Addr{IP: gw.Addr().As16()},
- }
- }
- data, err := route.Marshal()
- if err != nil {
- return fmt.Errorf("failed to create route.RouteMessage: %w", err)
- }
- _, err = unix.Write(sock, data[:])
- if err != nil {
- return fmt.Errorf("failed to write route.RouteMessage to socket: %w", err)
- }
- return nil
- }
|