2020-05-29 01:43:15 +01:00
|
|
|
// Copyright (c) 2020 Tailscale Inc & AUTHORS All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
|
|
|
package netns
|
|
|
|
|
|
|
|
import (
|
2020-05-31 23:36:10 +01:00
|
|
|
"bufio"
|
|
|
|
"bytes"
|
2020-05-31 09:31:01 +01:00
|
|
|
"errors"
|
2020-05-31 22:35:30 +01:00
|
|
|
"flag"
|
2020-05-29 01:43:15 +01:00
|
|
|
"fmt"
|
2020-05-31 23:36:10 +01:00
|
|
|
"io"
|
2020-05-30 05:58:31 +01:00
|
|
|
"os"
|
2020-05-31 09:31:01 +01:00
|
|
|
"os/exec"
|
|
|
|
"strings"
|
|
|
|
"sync"
|
2020-05-29 01:43:15 +01:00
|
|
|
"syscall"
|
|
|
|
|
|
|
|
"golang.org/x/sys/unix"
|
|
|
|
)
|
|
|
|
|
|
|
|
// tailscaleBypassMark is the mark indicating that packets originating
|
|
|
|
// from a socket should bypass Tailscale-managed routes during routing
|
|
|
|
// table lookups.
|
|
|
|
//
|
|
|
|
// Keep this in sync with tailscaleBypassMark in
|
|
|
|
// wgengine/router/router_linux.go.
|
|
|
|
// The mark is attached to a socket with the SO_MARK option by setBypassMark.
const tailscaleBypassMark = 0x20000
|
|
|
|
|
2020-05-31 22:01:20 +01:00
|
|
|
// ipRuleOnce guards the one-time probe performed by ipRuleAvailable and
// stores the probe's result in v.
var ipRuleOnce struct {
	sync.Once
	v bool
}

// ipRuleAvailable reports whether running the 'ip rule' command succeeds.
// The command is executed at most once; later calls return the cached
// result. When it does not work, we have to fall back to SO_BINDTODEVICE
// on our sockets instead.
func ipRuleAvailable() bool {
	probe := func() {
		err := exec.Command("ip", "rule").Run()
		ipRuleOnce.v = err == nil
	}
	ipRuleOnce.Do(probe)
	return ipRuleOnce.v
}
|
2020-05-31 09:31:01 +01:00
|
|
|
|
2020-05-31 23:36:10 +01:00
|
|
|
// zeroRouteBytes is the byte sequence defaultRouteInterface looks for in each
// line of /proc/net/route before doing any further parsing of that line.
var zeroRouteBytes = []byte("00000000")
|
|
|
|
|
2020-05-31 09:31:01 +01:00
|
|
|
// defaultRouteInterface returns the name of the network interface that owns
|
|
|
|
// the default route, not including any tailscale interfaces. We only use
|
|
|
|
// this in SO_BINDTODEVICE mode.
|
|
|
|
func defaultRouteInterface() (string, error) {
|
2020-05-31 23:36:10 +01:00
|
|
|
f, err := os.Open("/proc/net/route")
|
2020-05-31 09:31:01 +01:00
|
|
|
if err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
2020-05-31 23:36:10 +01:00
|
|
|
defer f.Close()
|
|
|
|
br := bufio.NewReaderSize(f, 128)
|
|
|
|
for {
|
|
|
|
line, err := br.ReadSlice('\n')
|
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
|
|
|
if !bytes.Contains(line, zeroRouteBytes) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
fields := strings.Fields(string(line))
|
2020-05-31 09:31:01 +01:00
|
|
|
ifc := fields[0]
|
|
|
|
ip := fields[1]
|
|
|
|
netmask := fields[7]
|
|
|
|
|
|
|
|
if strings.HasPrefix(ifc, "tailscale") ||
|
|
|
|
strings.HasPrefix(ifc, "wg") {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if ip == "00000000" && netmask == "00000000" {
|
|
|
|
// default route
|
|
|
|
return ifc, nil // interface name
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return "", errors.New("no default routes found")
|
|
|
|
}
|
|
|
|
|
|
|
|
// ignoreErrors reports whether a failure to set the socket options
// (setsockopt) should be ignored in this process.
func ignoreErrors() bool {
	// Inside a test binary (the test.v flag is registered) errors are
	// ignored. We assume the test knows what it's doing and performs its
	// own skips or permission checks if it builds a world that needs netns
	// to work; by default tests are assumed not to need netns, so a failing
	// sockopt is harmless.
	runningInTest := flag.CommandLine.Lookup("test.v") != nil
	if runningInTest {
		return true
	}
	// Only root can manipulate these socket flags, so for any other user
	// the failure is expected and ignored.
	return os.Getuid() != 0
}
|
|
|
|
|
2020-05-29 01:43:15 +01:00
|
|
|
// control marks c as necessary to dial in a separate network namespace.
|
|
|
|
//
|
|
|
|
// It's intentionally the same signature as net.Dialer.Control
|
|
|
|
// and net.ListenConfig.Control.
|
|
|
|
func control(network, address string, c syscall.RawConn) error {
|
2020-05-31 22:29:54 +01:00
|
|
|
var sockErr error
|
|
|
|
err := c.Control(func(fd uintptr) {
|
|
|
|
if ipRuleAvailable() {
|
|
|
|
sockErr = setBypassMark(fd)
|
|
|
|
} else {
|
|
|
|
sockErr = bindToDevice(fd)
|
2020-05-30 05:58:31 +01:00
|
|
|
}
|
2020-05-31 22:29:54 +01:00
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("RawConn.Control on %T: %w", c, err)
|
|
|
|
}
|
|
|
|
if sockErr != nil && ignoreErrors() {
|
|
|
|
// TODO(bradfitz): maybe log once? probably too spammy for e.g. CLI tools like tailscale netcheck.
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
return sockErr
|
|
|
|
}
|
|
|
|
|
|
|
|
func setBypassMark(fd uintptr) error {
|
|
|
|
if err := unix.SetsockoptInt(int(fd), unix.SOL_SOCKET, unix.SO_MARK, tailscaleBypassMark); err != nil {
|
|
|
|
return fmt.Errorf("setting SO_MARK bypass: %w", err)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func bindToDevice(fd uintptr) error {
|
|
|
|
ifc, err := defaultRouteInterface()
|
|
|
|
if err != nil {
|
|
|
|
// Make sure we bind to *some* interface,
|
|
|
|
// or we could get a routing loop.
|
|
|
|
// "lo" is always wrong, but if we don't have
|
|
|
|
// a default route anyway, it doesn't matter.
|
|
|
|
ifc = "lo"
|
|
|
|
}
|
|
|
|
if err := unix.SetsockoptString(int(fd), unix.SOL_SOCKET, unix.SO_BINDTODEVICE, ifc); err != nil {
|
|
|
|
return fmt.Errorf("setting SO_BINDTODEVICE: %w", err)
|
2020-05-29 01:43:15 +01:00
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|