tailscale/wgengine/netstack/netstack_test.go

// Copyright (c) Tailscale Inc & AUTHORS
// SPDX-License-Identifier: BSD-3-Clause

package netstack

import (
	"context"
	"fmt"
	"maps"
	"net"
	"net/netip"
	"runtime"
	"testing"
	"time"

	"gvisor.dev/gvisor/pkg/buffer"
	"gvisor.dev/gvisor/pkg/tcpip"
	"gvisor.dev/gvisor/pkg/tcpip/header"
	"gvisor.dev/gvisor/pkg/tcpip/stack"
	"tailscale.com/envknob"
	"tailscale.com/ipn"
	"tailscale.com/ipn/ipnlocal"
	"tailscale.com/ipn/store/mem"
	"tailscale.com/metrics"
	"tailscale.com/net/packet"
	"tailscale.com/net/tsaddr"
	"tailscale.com/net/tsdial"
	"tailscale.com/net/tstun"
	"tailscale.com/tsd"
	"tailscale.com/tstest"
	"tailscale.com/types/ipproto"
	"tailscale.com/types/logid"
	"tailscale.com/wgengine"
	"tailscale.com/wgengine/filter"
)

// TestInjectInboundLeak tests that injectInbound doesn't leak memory.
// See https://github.com/tailscale/tailscale/issues/3762
//
// It builds a userspace engine and a netstack Impl on top of a fake TUN
// device, injects N packets, and fails if the number of heap objects reported
// by the runtime grew by N or more between the two measurements.
func TestInjectInboundLeak(t *testing.T) {
	tunDev := tstun.NewFake()
	dialer := new(tsdial.Dialer)
	// logf forwards to t.Logf, but goes quiet once the test has failed.
	logf := func(format string, args ...any) {
		if !t.Failed() {
			t.Logf(format, args...)
		}
	}
	sys := new(tsd.System)
	eng, err := wgengine.NewUserspaceEngine(logf, wgengine.Config{
		Tun:           tunDev,
		Dialer:        dialer,
		SetSubsystem:  sys.Set,
		HealthTracker: sys.HealthTracker(),
		Metrics:       sys.UserMetricsRegistry(),
	})
	if err != nil {
		t.Fatal(err)
	}
	defer eng.Close()
	sys.Set(eng)
	sys.Set(new(mem.Store))

	tunWrap := sys.Tun.Get()
	lb, err := ipnlocal.NewLocalBackend(logf, logid.PublicID{}, sys, 0)
	if err != nil {
		t.Fatal(err)
	}

	ns, err := Create(logf, tunWrap, eng, sys.MagicSock.Get(), dialer, sys.DNSManager.Get(), sys.ProxyMapper())
	if err != nil {
		t.Fatal(err)
	}
	defer ns.Close()
	ns.ProcessLocalIPs = true
	if err := ns.Start(lb); err != nil {
		t.Fatalf("Start: %v", err)
	}
	// Report every address as local for the duration of the test.
	ns.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return true })

	// The same zero-value parsed packet is injected on every iteration.
	pkt := &packet.Parsed{}
	const N = 10_000
	ms0 := getMemStats()
	for range N {
		outcome, _ := ns.injectInbound(pkt, tunWrap, nil)
		if outcome != filter.DropSilently {
			t.Fatalf("got outcome %v; want DropSilently", outcome)
		}
	}
	ms1 := getMemStats()
	// Growth of at least one heap object per injected packet is treated as
	// a leak; smaller growth is tolerated.
	if grew := int64(ms1.HeapObjects) - int64(ms0.HeapObjects); grew >= N {
		t.Fatalf("grew by %v (which is too much and >= the %v packets we sent)", grew, N)
	}
}

// getMemStats runs a garbage collection and then returns a snapshot of the
// runtime's memory statistics taken immediately afterwards.
func getMemStats() runtime.MemStats {
	var stats runtime.MemStats
	runtime.GC()
	runtime.ReadMemStats(&stats)
	return stats
}

// makeNetstack builds and starts a netstack Impl for use in tests.
//
// It wires a userspace engine to a fake TUN device and an in-memory state
// store, creates the Impl and a LocalBackend on top of it, and registers
// cleanups on tb that close the Impl and the engine.
//
// Before Start is called, every address is reported as local and then the
// optional config callback is invoked, so config may override that default
// along with any other pre-Start field. Any setup failure aborts the test via
// tb.Fatal.
func makeNetstack(tb testing.TB, config func(*Impl)) *Impl {
	// Attribute setup failures to the calling test rather than this helper.
	tb.Helper()

	tunDev := tstun.NewFake()
	sys := &tsd.System{}
	sys.Set(new(mem.Store))
	dialer := new(tsdial.Dialer)
	logf := tstest.WhileTestRunningLogger(tb)
	eng, err := wgengine.NewUserspaceEngine(logf, wgengine.Config{
		Tun:           tunDev,
		Dialer:        dialer,
		SetSubsystem:  sys.Set,
		HealthTracker: sys.HealthTracker(),
		Metrics:       sys.UserMetricsRegistry(),
	})
	if err != nil {
		tb.Fatal(err)
	}
	tb.Cleanup(func() { eng.Close() })
	sys.Set(eng)

	ns, err := Create(logf, sys.Tun.Get(), eng, sys.MagicSock.Get(), dialer, sys.DNSManager.Get(), sys.ProxyMapper())
	if err != nil {
		tb.Fatal(err)
	}
	tb.Cleanup(func() { ns.Close() })

	lb, err := ipnlocal.NewLocalBackend(logf, logid.PublicID{}, sys, 0)
	if err != nil {
		tb.Fatalf("NewLocalBackend: %v", err)
	}

	// Default: treat every address as local. config runs afterwards and
	// may replace this.
	ns.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return true })
	if config != nil {
		config(ns)
	}
	if err := ns.Start(lb); err != nil {
		tb.Fatalf("Start: %v", err)
	}
	return ns
}

// TestShouldHandlePing checks Impl.shouldHandlePing against ICMPv4 and ICMPv6
// echo requests addressed to an external IP, a Tailscale IPv6 address, and a
// 4via6 address.
func TestShouldHandlePing(t *testing.T) {
	srcIP := netip.AddrFrom4([4]byte{1, 2, 3, 4})

	// echo4 generates an ICMPv4 echo request to dst and decodes it back
	// into a packet.Parsed.
	echo4 := func(dst netip.Addr) *packet.Parsed {
		hdr := packet.ICMP4Header{
			IP4Header: packet.IP4Header{
				IPProto: ipproto.ICMPv4,
				Src:     srcIP,
				Dst:     dst,
			},
			Type: packet.ICMP4EchoRequest,
			Code: packet.ICMP4NoCode,
		}
		_, body := packet.ICMPEchoPayload(nil)
		parsed := new(packet.Parsed)
		parsed.Decode(packet.Generate(hdr, body))
		return parsed
	}

	// echo6 is the ICMPv6 counterpart of echo4.
	echo6 := func(dst netip.Addr) *packet.Parsed {
		hdr := packet.ICMP6Header{
			IP6Header: packet.IP6Header{
				IPProto: ipproto.ICMPv6,
				Src:     srcIP,
				Dst:     dst,
			},
			Type: packet.ICMP6EchoRequest,
			Code: packet.ICMP6NoCode,
		}
		_, body := packet.ICMPEchoPayload(nil)
		parsed := new(packet.Parsed)
		parsed.Decode(packet.Generate(hdr, body))
		return parsed
	}

	// newImpl starts a netstack whose ProcessSubnets field is set to
	// subnets before Start.
	newImpl := func(t *testing.T, subnets bool) *Impl {
		return makeNetstack(t, func(ns *Impl) {
			ns.ProcessSubnets = subnets
		})
	}

	t.Run("ICMP4", func(t *testing.T) {
		want := netip.MustParseAddr("5.6.7.8")
		ping := echo4(want)

		got, handled := newImpl(t, true).shouldHandlePing(ping)
		if !handled {
			t.Errorf("expected shouldHandlePing==true")
		}
		if got != want {
			t.Errorf("got dst %s; want %s", got, want)
		}
	})

	t.Run("ICMP6-no-via", func(t *testing.T) {
		want := netip.MustParseAddr("2a09:8280:1::4169")
		ping := echo6(want)

		got, handled := newImpl(t, true).shouldHandlePing(ping)

		// This destination is out on the network, so the ping is
		// expected to be handled.
		if !handled {
			t.Errorf("expected shouldHandlePing==true")
		}
		if got != want {
			t.Errorf("got dst %s; want %s", got, want)
		}
	})

	t.Run("ICMP6-tailscale-addr", func(t *testing.T) {
		ping := echo6(netip.MustParseAddr("fd7a:115c:a1e0:ab12::1"))

		// A Tailscale IP that is not 4via6 is not ours to handle.
		if _, handled := newImpl(t, true).shouldHandlePing(ping); handled {
			t.Errorf("expected shouldHandlePing==false")
		}
	})

	// 4via6 pings are handled whether or not ProcessSubnets is set.
	for _, subnets := range []bool{true, false} {
		name := fmt.Sprintf("ICMP6-4via6-ProcessSubnets-%v", subnets)
		t.Run(name, func(t *testing.T) {
			// 4via6 route 10.1.1.0/24 with site ID 7; the
			// destination is 10.1.1.9 inside that route.
			ping := echo6(netip.MustParseAddr("fd7a:115c:a1e0:b1a:0:7:a01:109"))
			want := netip.MustParseAddr("10.1.1.9")

			got, handled := newImpl(t, subnets).shouldHandlePing(ping)

			// Handled because the destination is 4via6.
			switch {
			case !handled:
				t.Errorf("expected shouldHandlePing==true")
			case got != want:
				t.Errorf("got dst %s; want %s", got, want)
			}
		})
	}
}

// looksLikeATailscaleSelfAddress is a test stand-in for "is this one of our
// own addresses": it accepts IPv4 addresses that tsaddr considers Tailscale
// IPs and IPv6 addresses inside tsaddr's Tailscale 4-to-6 range.
func looksLikeATailscaleSelfAddress(addr netip.Addr) bool {
	switch {
	case addr.Is4():
		return tsaddr.IsTailscaleIP(addr)
	case addr.Is6():
		return tsaddr.Tailscale4To6Range().Contains(addr)
	default:
		return false
	}
}

// TestShouldProcessInbound runs Impl.shouldProcessInbound over a table of TCP
// SYN packets. Each case may adjust the Impl before Start (beforeStart) and
// after Start (afterStart), and may be restricted to a single GOOS.
func TestShouldProcessInbound(t *testing.T) {
	// Every packet in the table comes from this peer.
	const peerSrc = "100.101.102.103:1234"

	// $ tailscale debug via 7 10.1.1.9/24
	// fd7a:115c:a1e0:b1a:0:7:a01:109/120
	const viaDst = "[fd7a:115c:a1e0:b1a:0:7:a01:109]:5678"

	// syn4 and syn6 build a TCP SYN from peerSrc to dst.
	syn4 := func(dst string) *packet.Parsed {
		return &packet.Parsed{
			IPVersion: 4,
			IPProto:   ipproto.TCP,
			Src:       netip.MustParseAddrPort(peerSrc),
			Dst:       netip.MustParseAddrPort(dst),
			TCPFlags:  packet.TCPSyn,
		}
	}
	syn6 := func(dst string) *packet.Parsed {
		return &packet.Parsed{
			IPVersion: 6,
			IPProto:   ipproto.TCP,
			Src:       netip.MustParseAddrPort(peerSrc),
			Dst:       netip.MustParseAddrPort(dst),
			TCPFlags:  packet.TCPSyn,
		}
	}

	// startAdvertising starts the backend with prefs that advertise
	// exactly one route.
	startAdvertising := func(i *Impl, route string) {
		prefs := ipn.NewPrefs()
		prefs.AdvertiseRoutes = []netip.Prefix{netip.MustParsePrefix(route)}
		i.lb.Start(ipn.Options{
			UpdatePrefs: prefs,
		})
	}

	// startWithSSH starts the backend with RunSSH set as given.
	startWithSSH := func(i *Impl, runSSH bool) {
		prefs := ipn.NewPrefs()
		prefs.RunSSH = runSSH
		i.lb.Start(ipn.Options{
			UpdatePrefs: prefs,
		})
	}

	// isSelfDst treats only the 100.101.102.104 destination used by the
	// IPv4 cases as a local IP.
	isSelfDst := func(addr netip.Addr) bool {
		return addr.String() == "100.101.102.104"
	}

	testCases := []struct {
		name        string
		pkt         *packet.Parsed
		afterStart  func(*Impl) // optional; after Impl.Start is called
		beforeStart func(*Impl) // optional; before Impl.Start is called
		want        bool
		runOnGOOS   string
	}{
		{
			name: "ipv6-via",
			pkt:  syn6(viaDst),
			beforeStart: func(i *Impl) {
				// Via traffic must be handled even with both
				// local-IP and subnet processing turned off.
				i.ProcessLocalIPs = false
				i.ProcessSubnets = false
			},
			afterStart: func(i *Impl) {
				// $ tailscale debug via 7 10.1.1.0/24
				// fd7a:115c:a1e0:b1a:0:7:a01:100/120
				startAdvertising(i, "fd7a:115c:a1e0:b1a:0:7:a01:100/120")
				i.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
			},
			want: true,
		},
		{
			name: "ipv6-via-not-advertised",
			pkt:  syn6(viaDst),
			afterStart: func(i *Impl) {
				// $ tailscale debug via 7 10.1.2.0/24
				// fd7a:115c:a1e0:b1a:0:7:a01:200/120
				startAdvertising(i, "fd7a:115c:a1e0:b1a:0:7:a01:200/120")
			},
			want: false,
		},
		{
			name: "tailscale-ssh-enabled",
			pkt:  syn4("100.101.102.104:22"),
			afterStart: func(i *Impl) {
				startWithSSH(i, true)
				i.atomicIsLocalIPFunc.Store(isSelfDst)
			},
			want:      true,
			runOnGOOS: "linux",
		},
		{
			name: "tailscale-ssh-disabled",
			pkt:  syn4("100.101.102.104:22"),
			afterStart: func(i *Impl) {
				// false is the default; set here to be explicit.
				startWithSSH(i, false)
				i.atomicIsLocalIPFunc.Store(isSelfDst)
			},
			want: false,
		},
		{
			name: "process-local-ips",
			pkt:  syn4("100.101.102.104:4567"),
			afterStart: func(i *Impl) {
				i.ProcessLocalIPs = true
				i.atomicIsLocalIPFunc.Store(isSelfDst)
			},
			want: true,
		},
		{
			name: "process-subnets",
			pkt:  syn4("10.1.2.3:4567"),
			beforeStart: func(i *Impl) {
				i.ProcessSubnets = true
			},
			afterStart: func(i *Impl) {
				// Treat Tailscale-range IPs as local; the
				// destination above falls outside that range.
				i.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
			},
			want: true,
		},
		{
			name: "peerapi-port-subnet-router", // see #6235
			pkt:  syn4("10.0.0.23:5555"),
			beforeStart: func(i *Impl) {
				// As if we were running on Linux where netstack isn't used.
				i.ProcessSubnets = false
				i.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return false })
			},
			afterStart: func(i *Impl) {
				startAdvertising(i, "10.0.0.1/24")

				// Make the PeerAPI port equal to the packet's
				// destination port.
				i.peerapiPort4Atomic.Store(5555)
				i.peerapiPort6Atomic.Store(5555)
			},
			want: false,
		},

		// TODO(andrew): test PeerAPI
		// TODO(andrew): test TCP packets without the SYN flag set
	}

	for _, tc := range testCases {
		t.Run(tc.name, func(t *testing.T) {
			if goos := tc.runOnGOOS; goos != "" && goos != runtime.GOOS {
				t.Skipf("skipping on GOOS=%v", runtime.GOOS)
			}

			impl := makeNetstack(t, tc.beforeStart)
			if hook := tc.afterStart; hook != nil {
				hook(impl)
			}

			got := impl.shouldProcessInbound(tc.pkt, nil)
			if got == tc.want {
				t.Logf("OK: shouldProcessInbound() = %v", got)
				return
			}
			t.Errorf("got shouldProcessInbound()=%v; want %v", got, tc.want)
		})
	}
}

func tcp4syn(tb testing.TB, src, dst netip.Addr, sport, dport uint16) []byte {
	ip := header.IPv4(make([]byte, header.IPv4MinimumSize+header.TCPMinimumSize))
	ip.Encode(&header.IPv4Fields{
		Protocol:    uint8(header.TCPProtocolNumber),
		TotalLength: header.IPv4MinimumSize + header.TCPMinimumSize,
		TTL:         64,
		SrcAddr:     tcpip.AddrFrom4Slice(src.AsSlice()),
		DstAddr:     tcpip.AddrFrom4Slice(dst.AsSlice()),
	})
	ip.SetChecksum(^ip.CalculateChecksum())
	if !ip.IsChecksumValid() {
		tb.Fatal("test broken; packet has incorrect IP checksum")
	}

	tcp := header.TCP(ip[header.IPv4MinimumSize:])
	tcp.Encode(&header.TCPFields{
		SrcPort:    sport,
		DstPort:    dport,
		SeqNum:     0,
		DataOffset: header.TCPMinimumSize,
		Flags:      header.TCPFlagSyn,
		WindowSize: 65535,
		Checksum:   0,
	})
	xsum := header.PseudoHeaderChecksum(
		header.TCPProtocolNumber,
		tcpip.AddrFrom4Slice(src.AsSlice()),
		tcpip.AddrFrom4Slice(dst.AsSlice()),
		uint16(header.TCPMinimumSize),
	)
	tcp.SetChecksum(^tcp.CalculateChecksum(xsum))
	if !tcp.IsChecksumValid(tcpip.AddrFrom4Slice(src.AsSlice()), tcpip.AddrFrom4Slice(dst.AsSlice()), 0, 0) {
		tb.Fatal("test broken; packet has incorrect TCP checksum")
	}

	return ip
}

// makeHangDialer returns a dial function together with a notification
// channel. Each call to the dial function logs its arguments, makes a
// non-blocking send on the channel (buffer size 1, so extra signals are
// dropped), and then blocks until either its context is done or tb's cleanup
// runs. It always returns a nil conn and a "canceled" error.
func makeHangDialer(tb testing.TB) (func(context.Context, string, string) (net.Conn, error), chan struct{}) {
	// testDone is closed from tb's cleanup to release any blocked dial.
	testDone := make(chan struct{})
	tb.Cleanup(func() { close(testDone) })

	dialed := make(chan struct{}, 1)
	hang := func(ctx context.Context, network, address string) (net.Conn, error) {
		tb.Logf("hangDialer: called with network=%q address=%q", network, address)

		// Announce the dial without ever blocking on the receiver.
		select {
		case dialed <- struct{}{}:
		default:
		}

		// Park here until the caller gives up or the test ends.
		select {
		case <-testDone:
			tb.Logf("function completed")
		case <-ctx.Done():
			tb.Logf("context done")
		}
		return nil, fmt.Errorf("canceled")
	}
	return hang, dialed
}

// TestTCPForwardLimits covers the TCP forwarder's in-flight accounting in the
// success case, i.e. when no limit is hit: one forwarded SYN, re-sent once,
// must be counted as exactly one in-flight connection.
func TestTCPForwardLimits(t *testing.T) {
	envknob.Setenv("TS_DEBUG_NETSTACK", "true")
	impl := makeNetstack(t, func(ns *Impl) {
		ns.ProcessSubnets = true
	})

	dial, dialStarted := makeHangDialer(t)
	impl.forwardDialFunc = dial

	// Advertise TEST-NET-1, the documentation-only block, which should
	// never actually be routable.
	prefs := ipn.NewPrefs()
	prefs.AdvertiseRoutes = []netip.Prefix{netip.MustParsePrefix("192.0.2.0/24")}
	impl.lb.Start(ipn.Options{
		UpdatePrefs: prefs,
	})
	impl.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)

	client := netip.MustParseAddr("100.101.102.103")
	destAddr := netip.MustParseAddr("192.0.2.1")
	raw := tcp4syn(t, client, destAddr, 1234, 4567)

	// inject decodes raw into parsed and hands it to netstack. Decoding
	// from bytes fills in packet.Parsed's internal buffer. The outcome
	// must be "drop silently", meaning netstack is processing the packet
	// itself instead of delivering it to the host system.
	var parsed packet.Parsed
	inject := func() {
		parsed.Decode(raw)
		resp, _ := impl.injectInbound(&parsed, impl.tundev, nil)
		if resp != filter.DropSilently {
			t.Errorf("got filter outcome %v, want filter.DropSilently", resp)
		}
	}

	inject()

	ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
	defer cancel()

	// Block until the forwarder has an outgoing dial in flight.
	select {
	case <-dialStarted:
		t.Logf("got connection in progress")
	case <-ctx.Done():
		t.Fatalf("timed out waiting for connection")
	}

	// The same SYN again is deduplicated and must not bump the counter.
	inject()

	// Snapshot the per-client map under the lock; exactly one in-flight
	// entry is expected for our client.
	impl.mu.Lock()
	inFlight := maps.Clone(impl.connsInFlightByClient)
	impl.mu.Unlock()

	if n, present := inFlight[client]; !present || n != 1 {
		t.Errorf("expected 1 in-flight connection for %v, got: %v", client, inFlight)
	}

	// The exported expvar gauge must agree.
	const metricName = "gauge_tcp_forward_in_flight"
	vars := impl.ExpVar().(*metrics.Set)
	if v := vars.Get(metricName).String(); v != "1" {
		t.Errorf("got metric %q=%s, want 1", metricName, v)
	}
}

// TestTCPForwardLimits_PerClient checks the per-client cap on in-flight TCP
// forwards: with the cap overridden to 1, a second connection attempt from
// the same client must be counted as dropped.
func TestTCPForwardLimits_PerClient(t *testing.T) {
	envknob.Setenv("TS_DEBUG_NETSTACK", "true")

	// Override both limits for the lifetime of this test.
	tstest.Replace(t, &maxInFlightConnectionAttemptsForTest, 2)
	tstest.Replace(t, &maxInFlightConnectionAttemptsPerClientForTest, 1)

	impl := makeNetstack(t, func(ns *Impl) {
		ns.ProcessSubnets = true
	})

	dial, dialStarted := makeHangDialer(t)
	impl.forwardDialFunc = dial

	// Advertise TEST-NET-1, the documentation-only block, which should
	// never actually be routable.
	prefs := ipn.NewPrefs()
	prefs.AdvertiseRoutes = []netip.Prefix{netip.MustParsePrefix("192.0.2.0/24")}
	impl.lb.Start(ipn.Options{
		UpdatePrefs: prefs,
	})
	impl.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)

	client := netip.MustParseAddr("100.101.102.103")
	destAddr := netip.MustParseAddr("192.0.2.1")

	// injectSYN sends a SYN from client to destAddr, using a new source
	// port on each call so that the packets are not deduplicated by
	// endpoint. The packet is decoded from bytes so that packet.Parsed's
	// internal buffer is filled in. The outcome must be "drop silently",
	// meaning netstack took the packet instead of passing it to the host.
	nextPort := uint16(1234)
	injectSYN := func() {
		raw := tcp4syn(t, client, destAddr, nextPort, 4567)
		nextPort++

		var parsed packet.Parsed
		parsed.Decode(raw)

		resp, _ := impl.injectInbound(&parsed, impl.tundev, nil)
		if resp != filter.DropSilently {
			t.Fatalf("got filter outcome %v, want filter.DropSilently", resp)
		}
	}

	ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
	defer cancel()

	// awaitDial blocks until the hang dialer reports a dial or ctx expires.
	awaitDial := func() {
		select {
		case <-dialStarted:
			t.Logf("got connection in progress")
		case <-ctx.Done():
			t.Fatalf("timed out waiting for connection")
		}
	}

	// First SYN: starts a forward; wait until its dial is in flight.
	injectSYN()
	awaitDial()

	// Snapshot the per-client map under the lock; exactly one in-flight
	// entry is expected for our client.
	impl.mu.Lock()
	inFlight := maps.Clone(impl.connsInFlightByClient)
	impl.mu.Unlock()

	if n, present := inFlight[client]; !present || n != 1 {
		t.Errorf("expected 1 in-flight connection for %v, got: %v", client, inFlight)
	}

	vars := impl.ExpVar().(*metrics.Set)

	// With a cap of 1, this client is now at its limit.
	if v := vars.Get("gauge_tcp_forward_in_flight_per_client_limit_reached").String(); v != "1" {
		t.Errorf("got limit reached expvar metric=%s, want 1", v)
	}

	// Second SYN: expected to be dropped, which shows up in both the
	// expvar counter and the clientmetric.
	injectSYN()

	const metricName = "counter_tcp_forward_max_in_flight_per_client_drop"
	if v := vars.Get(metricName).String(); v != "1" {
		t.Errorf("got expvar metric %q=%s, want 1", metricName, v)
	}

	if v := metricPerClientForwardLimit.Value(); v != 1 {
		t.Errorf("got clientmetric limit metric=%d, want 1", v)
	}
}

// TestHandleLocalPackets tests the handleLocalPackets function, checking
// which packets it claims for itself (filter.DropSilently) and which it lets
// through for further processing (filter.Accept). The packets are destined
// for "local" IPs: addresses that belong to this node or that it is
// responsible for.
//
// See, e.g. #11304
func TestHandleLocalPackets(t *testing.T) {
	selfIP4 := netip.MustParseAddr("100.64.1.2")
	selfIP6 := netip.MustParseAddr("fd7a:115c:a1e0::123")

	impl := makeNetstack(t, func(ns *Impl) {
		ns.ProcessSubnets = false
		ns.ProcessLocalIPs = false
		ns.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
			return addr == selfIP4 || addr == selfIP6
		})
	})

	// Advertise a single 4via6 route:
	//    $ tailscale debug via 7 10.1.1.0/24
	//    fd7a:115c:a1e0:b1a:0:7:a01:100/120
	prefs := ipn.NewPrefs()
	prefs.AdvertiseRoutes = []netip.Prefix{
		netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:100/120"),
	}
	if _, err := impl.lb.EditPrefs(&ipn.MaskedPrefs{
		Prefs:              *prefs,
		AdvertiseRoutesSet: true,
	}); err != nil {
		t.Fatalf("EditPrefs: %v", err)
	}

	testCases := []struct {
		name     string
		pkt      *packet.Parsed
		want     filter.Response
		wantText string // how want is spelled in the failure message
	}{
		{
			name: "ShouldHandleServiceIP",
			pkt: &packet.Parsed{
				IPVersion: 4,
				IPProto:   ipproto.TCP,
				Src:       netip.MustParseAddrPort("127.0.0.1:9999"),
				Dst:       netip.MustParseAddrPort("100.100.100.100:53"),
				TCPFlags:  packet.TCPSyn,
			},
			want:     filter.DropSilently,
			wantText: "filter.DropSilently",
		},
		{
			// DropSilently is expected because the packet was
			// handled by injecting it into netstack, which takes
			// care of creating the TCP forwarder; dropping it
			// keeps it from also being processed outside netstack.
			name: "ShouldHandle4via6",
			pkt: &packet.Parsed{
				IPVersion: 6,
				IPProto:   ipproto.TCP,
				Src:       netip.MustParseAddrPort("[::1]:1234"),

				// An IP inside the advertised 4via6 subnet:
				//    $ tailscale debug via 7 10.1.1.9/24
				//    fd7a:115c:a1e0:b1a:0:7:a01:109/120
				Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:109]:5678"),
				TCPFlags: packet.TCPSyn,
			},
			want:     filter.DropSilently,
			wantText: "filter.DropSilently",
		},
		{
			// Accept means handleLocalPackets did not take the
			// packet: it continues through further processing
			// rather than being dropped as already handled.
			name: "OtherNonHandled",
			pkt: &packet.Parsed{
				IPVersion: 6,
				IPProto:   ipproto.TCP,
				Src:       netip.MustParseAddrPort("[::1]:1234"),

				// An IP that is *not* in the advertised route:
				//    $ tailscale debug via 99 10.1.1.9/24
				//    fd7a:115c:a1e0:b1a:0:63:a01:109/120
				Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:63:a01:109]:5678"),
				TCPFlags: packet.TCPSyn,
			},
			want:     filter.Accept,
			wantText: "filter.Accept",
		},
	}

	for _, tc := range testCases {
		t.Run(tc.name, func(t *testing.T) {
			resp, _ := impl.handleLocalPackets(tc.pkt, impl.tundev, nil)
			if resp != tc.want {
				t.Errorf("got filter outcome %v, want %s", resp, tc.wantText)
			}
		})
	}
}

// TestShouldSendToHost checks Impl.shouldSendToHost for UDP packets built
// from a table of source/destination pairs. Every case runs against its own
// netstack that advertises one 4via6 route and treats only selfIP4 and
// selfIP6 as local.
func TestShouldSendToHost(t *testing.T) {
	var (
		selfIP4 = netip.MustParseAddr("100.64.1.2")
		selfIP6 = netip.MustParseAddr("fd7a:115c:a1e0::123")

		// A non-local IPv6 destination.
		// NOTE(review): the second group is "115", not "115c" — possibly
		// a typo for a Tailscale ULA address; confirm before changing.
		remoteV6 = netip.MustParseAddrPort("[fd7a:115:a1e0::99]:7777")

		// Source inside the advertised 4via6 route:
		//    $ tailscale debug via 7 10.1.1.99/24
		//    fd7a:115c:a1e0:b1a:0:7:a01:163/120
		handledViaSrc = netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:163]:12345")

		// Source in a 4via6 route this node does not advertise:
		//    $ tailscale debug via 4444 10.1.1.88/24
		//    fd7a:115c:a1e0:b1a:0:115c:a01:158/120
		otherViaSrc = netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:115c:a01:158]:12345")
	)

	// newImpl builds the netstack described in the function comment.
	newImpl := func(tb testing.TB) *Impl {
		ns := makeNetstack(tb, func(ns *Impl) {
			ns.ProcessSubnets = false
			ns.ProcessLocalIPs = false
			ns.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
				return addr == selfIP4 || addr == selfIP6
			})
		})

		// $ tailscale debug via 7 10.1.1.0/24
		// fd7a:115c:a1e0:b1a:0:7:a01:100/120
		prefs := ipn.NewPrefs()
		prefs.AdvertiseRoutes = []netip.Prefix{
			netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:100/120"),
		}
		if _, err := ns.lb.EditPrefs(&ipn.MaskedPrefs{
			Prefs:              *prefs,
			AdvertiseRoutesSet: true,
		}); err != nil {
			tb.Fatalf("EditPrefs: %v", err)
		}
		return ns
	}

	testCases := []struct {
		name     string
		src, dst netip.AddrPort
		want     bool
	}{
		// Replies from the service IP to localhost go to the host,
		// not over WireGuard.
		{
			name: "from_service_ip_to_localhost",
			src:  netip.AddrPortFrom(serviceIP, 53),
			dst:  netip.MustParseAddrPort("127.0.0.1:9999"),
			want: true,
		},
		{
			name: "from_service_ip_to_localhost_v6",
			src:  netip.AddrPortFrom(serviceIPv6, 53),
			dst:  netip.MustParseAddrPort("[::1]:9999"),
			want: true,
		},
		// Replies from the local IP to a remote host go over
		// WireGuard rather than to the host.
		{
			name: "local_ip_to_remote",
			src:  netip.AddrPortFrom(selfIP4, 12345),
			dst:  netip.MustParseAddrPort("100.64.99.88:7777"),
			want: false,
		},
		{
			name: "local_ip_to_remote_v6",
			src:  netip.AddrPortFrom(selfIP6, 12345),
			dst:  remoteV6,
			want: false,
		},
		// Replies from a handled 4via6 address to a remote host go
		// over WireGuard, not to the local host. See:
		//     https://github.com/tailscale/tailscale/issues/12448
		{
			name: "4via6_to_remote",
			src:  handledViaSrc,
			dst:  remoteV6,
			want: false,
		},
		// Replies from a handled 4via6 address to this host's own
		// Tailscale IP *are* sent to the local host. See:
		//     https://github.com/tailscale/tailscale/issues/11304
		{
			name: "4via6_to_local",
			src:  handledViaSrc,
			dst:  netip.AddrPortFrom(selfIP6, 7777),
			want: true,
		},
		// Traffic from a 4via6 address we do not handle is sent
		// outbound whether the destination is local or remote.
		//
		// In most cases this kind of traffic won't reach
		// shouldSendToHost at all, but confirm it anyway.
		{
			name: "other_4via6_to_local",
			src:  otherViaSrc,
			dst:  netip.AddrPortFrom(selfIP6, 7777),
			want: false,
		},
		{
			name: "other_4via6_to_remote",
			src:  otherViaSrc,
			dst:  remoteV6,
			want: false,
		},
	}

	for _, tc := range testCases {
		t.Run(tc.name, func(t *testing.T) {
			// Pick the packet builder from the source address family.
			build := makeUDP6PacketBuffer
			if tc.src.Addr().Is4() {
				build = makeUDP4PacketBuffer
			}
			pkt := build(tc.src, tc.dst)

			impl := newImpl(t)
			got := impl.shouldSendToHost(pkt)
			if got != tc.want {
				t.Errorf("shouldSendToHost returned %v, want %v", got, tc.want)
			}
		})
	}
}

// makeUDP4PacketBuffer returns a gVisor packet buffer holding an IPv4/UDP
// packet from src to dst with a fixed "hello world\n" payload.
//
// It panics if either address is not IPv4. The IPv4 and UDP checksum fields
// are left as zero.
func makeUDP4PacketBuffer(src, dst netip.AddrPort) *stack.PacketBuffer {
	if !src.Addr().Is4() || !dst.Addr().Is4() {
		panic("src and dst must be IPv4")
	}

	data := []byte("hello world\n")

	headerLen := header.IPv4MinimumSize + header.UDPMinimumSize
	pkt := stack.NewPacketBuffer(stack.PacketBufferOptions{
		ReserveHeaderBytes: headerLen,
		Payload:            buffer.MakeWithData(data),
	})

	// Initialize the UDP header.
	udp := header.UDP(pkt.TransportHeader().Push(header.UDPMinimumSize))
	pkt.TransportProtocolNumber = header.UDPProtocolNumber

	// Only the UDP header has been pushed so far, so pkt.Size() is the UDP
	// header plus the payload, which is the value the UDP length field needs.
	length := uint16(pkt.Size())
	udp.Encode(&header.UDPFields{
		SrcPort: src.Port(),
		DstPort: dst.Port(),
		Length:  length,
	})

	// Add IP header
	ipHdr := header.IPv4(pkt.NetworkHeader().Push(header.IPv4MinimumSize))
	pkt.NetworkProtocolNumber = header.IPv4ProtocolNumber
	ipHdr.Encode(&header.IPv4Fields{
		// TotalLength covers the whole datagram: both headers and the
		// payload, not just the headers.
		TotalLength: uint16(headerLen + len(data)),
		Protocol:    uint8(header.UDPProtocolNumber),
		SrcAddr:     tcpip.AddrFrom4(src.Addr().As4()),
		DstAddr:     tcpip.AddrFrom4(dst.Addr().As4()),
		Checksum:    0,
	})

	return pkt
}

// makeUDP6PacketBuffer builds a gVisor packet buffer holding an IPv6 UDP
// datagram from src to dst carrying a fixed "hello world\n" payload. It is a
// test helper for code that inspects packet headers.
//
// The UDP checksum is computed over the IPv6 pseudo-header, the UDP header
// and the payload.
//
// It panics if either src or dst is not an IPv6 address.
func makeUDP6PacketBuffer(src, dst netip.AddrPort) *stack.PacketBuffer {
	if !src.Addr().Is6() || !dst.Addr().Is6() {
		panic("src and dst must be IPv6")
	}
	data := []byte("hello world\n")

	// Space reserved in front of the payload for the two headers pushed below.
	packetLen := header.IPv6MinimumSize + header.UDPMinimumSize
	pkt := stack.NewPacketBuffer(stack.PacketBufferOptions{
		ReserveHeaderBytes: packetLen,
		Payload:            buffer.MakeWithData(data),
	})

	srcAddr := tcpip.AddrFrom16(src.Addr().As16())
	dstAddr := tcpip.AddrFrom16(dst.Addr().As16())

	// Size of the UDP header plus payload. This is the UDP length field, the
	// IPv6 payload length, and the length fed into the pseudo-header.
	udpLen := uint16(header.UDPMinimumSize + len(data))

	// Initialize the UDP header. It is pushed before the IPv6 header, the
	// same order makeUDP4PacketBuffer uses, because each pushed header is
	// placed in front of what the buffer already holds.
	udp := header.UDP(pkt.TransportHeader().Push(header.UDPMinimumSize))
	pkt.TransportProtocolNumber = header.UDPProtocolNumber
	udp.Encode(&header.UDPFields{
		SrcPort: src.Port(),
		DstPort: dst.Port(),
		Length:  udpLen,
	})

	// Calculate the UDP checksum: one's-complement sum of the pseudo-header
	// and the payload, then folded together with the UDP header itself.
	sum := uint32(header.PseudoHeaderChecksum(header.UDPProtocolNumber, srcAddr, dstAddr, udpLen)) +
		uint32(pkt.Data().Checksum())
	xsum := udp.CalculateChecksum(uint16(sum + sum>>16))
	// A checksum that would complement to zero is sent as all ones, since
	// zero means "no checksum" (RFC 768).
	if xsum != 0xffff {
		xsum = ^xsum
	}
	udp.SetChecksum(xsum)

	// Add IP header
	ipHdr := header.IPv6(pkt.NetworkHeader().Push(header.IPv6MinimumSize))
	pkt.NetworkProtocolNumber = header.IPv6ProtocolNumber
	ipHdr.Encode(&header.IPv6Fields{
		SrcAddr:           srcAddr,
		DstAddr:           dstAddr,
		PayloadLength:     udpLen,
		TransportProtocol: header.UDPProtocolNumber,
		HopLimit:          64,
	})

	return pkt
}
-												all: update copyright and license headers

This updates all source files to use a new standard header for copyright
and license declaration.  Notably, copyright no longer includes a date,
and we now use the standard SPDX-License-Identifier header.

This commit was done almost entirely mechanically with perl, and then
some minimal manual fixes.

Updates #6865

Signed-off-by: Will Norris <will@tailscale.com>

											
										
										
											2023-01-27 21:37:20 +00:00
+								// Copyright (c) Tailscale Inc & AUTHORS
 								// SPDX-License-Identifier: BSD-3-Clause
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
 								package netstack
 								import (
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"context"
-												wgengine/netstack: always respond to 4via6 echo requests (#5712)

As the comment in the code says, netstack should always respond to ICMP
echo requests to a 4via6 address, even if the netstack instance isn't
normally processing subnet traffic.

Follow-up to #5709

Change-Id: I504d0776c5824071b2a2e0e687bc33e24f6c4746
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 22:07:57 +00:00
+									"fmt"
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"maps"
 									"net"
-												all: convert more code to use net/netip directly

    perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
    perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
    goimports -w .

Then delete some stuff from the net/netaddr shim package which is no
longer needed.

Updates #5162

Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-07-26 04:14:09 +00:00
+									"net/netip"
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									"runtime"
 									"testing"
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"time"
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+									"gvisor.dev/gvisor/pkg/buffer"
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"gvisor.dev/gvisor/pkg/tcpip"
 									"gvisor.dev/gvisor/pkg/tcpip/header"
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+									"gvisor.dev/gvisor/pkg/tcpip/stack"
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"tailscale.com/envknob"
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+									"tailscale.com/ipn"
 									"tailscale.com/ipn/ipnlocal"
 									"tailscale.com/ipn/store/mem"
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									"tailscale.com/metrics"
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									"tailscale.com/net/packet"
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+									"tailscale.com/net/tsaddr"
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									"tailscale.com/net/tsdial"
 									"tailscale.com/net/tstun"
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									"tailscale.com/tsd"
-												wgengine/netstack: fix data race in tests

This uses the helper function added in #6173 to avoid flakes like:
    https://github.com/tailscale/tailscale/actions/runs/3826912237/jobs/6511078024

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: If3f1d3b9c0f64ffcb4ba9a30d3522ec49484f993

											
										
										
											2023-01-19 14:48:39 +00:00
+									"tailscale.com/tstest"
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									"tailscale.com/types/ipproto"
-												all: pass log IDs as the proper type rather than strings

This change focuses on the backend log ID, which is the most commonly
used in the client.  Tests which don't seem to make use of the log ID
just use the zero value.

Signed-off-by: Will Norris <will@tailscale.com>

											
										
										
											2023-03-23 17:49:56 +00:00
+									"tailscale.com/types/logid"
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									"tailscale.com/wgengine"
 									"tailscale.com/wgengine/filter"
 								)
 								// TestInjectInboundLeak tests that injectInbound doesn't leak memory.
 								// See https://github.com/tailscale/tailscale/issues/3762
 								func TestInjectInboundLeak(t *testing.T) {
 									tunDev := tstun.NewFake()
 									dialer := new(tsdial.Dialer)
-												all: use any instead of interface{}

My favorite part of generics.

Signed-off-by: Josh Bleecher Snyder <josh@tailscale.com>
											
										
										
											2022-03-16 23:27:57 +00:00
+									logf := func(format string, args ...any) {
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+										if !t.Failed() {
 											t.Logf(format, args...)
 										}
 									}
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									sys := new(tsd.System)
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									eng, err := wgengine.NewUserspaceEngine(logf, wgengine.Config{
-												ipn/ipnlocal, all: plumb health trackers in tests

I saw some panics in CI, like:

    2024-05-08T04:30:25.9553518Z ## WARNING: (non-fatal) nil health.Tracker (being strict in CI):
    2024-05-08T04:30:25.9554043Z goroutine 801 [running]:
    2024-05-08T04:30:25.9554489Z tailscale.com/health.(*Tracker).nil(0x0)
    2024-05-08T04:30:25.9555086Z 	tailscale.com/health/health.go:185 +0x70
    2024-05-08T04:30:25.9555688Z tailscale.com/health.(*Tracker).SetUDP4Unbound(0x0, 0x0)
    2024-05-08T04:30:25.9556373Z 	tailscale.com/health/health.go:532 +0x2f
    2024-05-08T04:30:25.9557296Z tailscale.com/wgengine/magicsock.(*Conn).bindSocket(0xc0003b4808, 0xc0003b4878, {0x1fbca53, 0x4}, 0x0)
    2024-05-08T04:30:25.9558301Z 	tailscale.com/wgengine/magicsock/magicsock.go:2481 +0x12c5
    2024-05-08T04:30:25.9559026Z tailscale.com/wgengine/magicsock.(*Conn).rebind(0xc0003b4808, 0x0)
    2024-05-08T04:30:25.9559874Z 	tailscale.com/wgengine/magicsock/magicsock.go:2510 +0x16f
    2024-05-08T04:30:25.9561038Z tailscale.com/wgengine/magicsock.NewConn({0xc000063c80, 0x0, 0xc000197930, 0xc000197950, 0xc000197960, {0x0, 0x0}, 0xc000197970, 0xc000198ee0, 0x0, ...})
    2024-05-08T04:30:25.9562402Z 	tailscale.com/wgengine/magicsock/magicsock.go:476 +0xd5f
    2024-05-08T04:30:25.9563779Z tailscale.com/wgengine.NewUserspaceEngine(0xc000063c80, {{0x22c8750, 0xc0001976b0}, 0x0, {0x22c3210, 0xc000063c80}, {0x22c31d8, 0x2d3c900}, 0x0, 0x0, ...})
    2024-05-08T04:30:25.9564982Z 	tailscale.com/wgengine/userspace.go:389 +0x159d
    2024-05-08T04:30:25.9565529Z tailscale.com/ipn/ipnlocal.newTestBackend(0xc000358b60)
    2024-05-08T04:30:25.9566086Z 	tailscale.com/ipn/ipnlocal/serve_test.go:675 +0x2a5
    2024-05-08T04:30:25.9566612Z ta

Updates #11874

Change-Id: I3432ed52d670743e532be4642f38dbd6e3763b1b
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-05-08 04:37:33 +00:00
+										Tun:           tunDev,
 										Dialer:        dialer,
 										SetSubsystem:  sys.Set,
 										HealthTracker: sys.HealthTracker(),
-												util/usermetrics: make usermetrics non-global

this commit changes usermetrics to be non-global, this is a building
block for correct metrics if a go process runs multiple tsnets or
in tests.

Updates #13420
Updates tailscale/corp#22075

Signed-off-by: Kristoffer Dalby <kristoffer@tailscale.com>

											
										
										
											2024-09-23 16:34:00 +00:00
+										Metrics:       sys.UserMetricsRegistry(),
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									})
 									if err != nil {
 										t.Fatal(err)
 									}
 									defer eng.Close()
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									sys.Set(eng)
 									sys.Set(new(mem.Store))
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									tunWrap := sys.Tun.Get()
 									lb, err := ipnlocal.NewLocalBackend(logf, logid.PublicID{}, sys, 0)
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+									if err != nil {
 										t.Fatal(err)
 									}
-												wgengine/netstack: remove unused taildrive deps

A filesystem was plumbed into netstack in 993acf4475b22d693
but hasn't been used since 2d5d6f5403f3. Remove it.

Noticed while rebasing a Tailscale fork elsewhere.

Updates tailscale/corp#16827

Change-Id: Ib76deeda205ffe912b77a59b9d22853ebff42813
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-11-01 17:50:40 +00:00
+									ns, err := Create(logf, tunWrap, eng, sys.MagicSock.Get(), dialer, sys.DNSManager.Get(), sys.ProxyMapper())
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+									if err != nil {
 										t.Fatal(err)
 									}
 									defer ns.Close()
 									ns.ProcessLocalIPs = true
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+									if err := ns.Start(lb); err != nil {
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+										t.Fatalf("Start: %v", err)
 									}
-												all: convert more code to use net/netip directly

    perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
    perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
    perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
    goimports -w .

Then delete some stuff from the net/netaddr shim package which is no
longer needed.

Updates #5162

Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-07-26 04:14:09 +00:00
+									ns.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return true })
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
 									pkt := &packet.Parsed{}
 									const N = 10_000
 									ms0 := getMemStats()
-												all: use Go 1.22 range-over-int

Updates #11058

Change-Id: I35e7ef9b90e83cac04ca93fd964ad00ed5b48430
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 20:15:13 +00:00
+									for range N {
-												net/tstun,wgengine{/netstack/gro}: refactor and re-enable gVisor GRO for Linux (#13172)

In 2f27319baf71681e221904d3a3ffe1badedc8e2e we disabled GRO due to a
data race around concurrent calls to tstun.Wrapper.Write(). This commit
refactors GRO to be thread-safe, and re-enables it on Linux.

This refactor now carries a GRO type across tstun and netstack APIs
with a lifetime that is scoped to a single tstun.Wrapper.Write() call.

In 25f0a3fc8f6f9cf681bb5afda8e1762816c67a8b we used build tags to
prevent importation of gVisor's GRO package on iOS as at the time we
believed it was contributing to additional memory usage on that
platform. It wasn't, so this commit simplifies and removes those
build tags.

Updates tailscale/corp#22353
Updates tailscale/corp#22125
Updates #6816

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-20 22:22:19 +00:00
+										outcome, _ := ns.injectInbound(pkt, tunWrap, nil)
-												wgengine/netstack: add a missing refcount decrement after packet injection

Fixes #3762
Updates #3745 (probably fixes?)

Change-Id: I1d3f0590fd5b8adfbc9110bc45ff717bb9e79aae
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-01-19 20:05:17 +00:00
+										if outcome != filter.DropSilently {
 											t.Fatalf("got outcome %v; want DropSilently", outcome)
 										}
 									}
 									ms1 := getMemStats()
 									if grew := int64(ms1.HeapObjects) - int64(ms0.HeapObjects); grew >= N {
 										t.Fatalf("grew by %v (which is too much and >= the %v packets we sent)", grew, N)
 									}
 								}
 								// getMemStats runs a garbage collection cycle and then returns a
 								// snapshot of the runtime's memory statistics taken right after it.
 								func getMemStats() (ms runtime.MemStats) {
 									// Collect before sampling so the snapshot is taken right
 									// after a completed GC cycle.
 									runtime.GC()
 									var snapshot runtime.MemStats
 									runtime.ReadMemStats(&snapshot)
 									return snapshot
 								}
-												wgengine/netstack: disable refsvfs2 leak tracking (#4378)

In addition an envknob (TS_DEBUG_NETSTACK_LEAK_MODE) now provides access
to set leak tracking to more useful values.

Fixes #4309

Signed-off-by: James Tucker <james@tailscale.com>
											
										
										
											2022-04-08 00:21:45 +00:00
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+								func makeNetstack(tb testing.TB, config func(*Impl)) *Impl {
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									tunDev := tstun.NewFake()
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									sys := &tsd.System{}
 									sys.Set(new(mem.Store))
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									dialer := new(tsdial.Dialer)
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+									logf := tstest.WhileTestRunningLogger(tb)
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									eng, err := wgengine.NewUserspaceEngine(logf, wgengine.Config{
-												ipn/ipnlocal, all: plumb health trackers in tests

I saw some panics in CI, like:

    2024-05-08T04:30:25.9553518Z ## WARNING: (non-fatal) nil health.Tracker (being strict in CI):
    2024-05-08T04:30:25.9554043Z goroutine 801 [running]:
    2024-05-08T04:30:25.9554489Z tailscale.com/health.(*Tracker).nil(0x0)
    2024-05-08T04:30:25.9555086Z 	tailscale.com/health/health.go:185 +0x70
    2024-05-08T04:30:25.9555688Z tailscale.com/health.(*Tracker).SetUDP4Unbound(0x0, 0x0)
    2024-05-08T04:30:25.9556373Z 	tailscale.com/health/health.go:532 +0x2f
    2024-05-08T04:30:25.9557296Z tailscale.com/wgengine/magicsock.(*Conn).bindSocket(0xc0003b4808, 0xc0003b4878, {0x1fbca53, 0x4}, 0x0)
    2024-05-08T04:30:25.9558301Z 	tailscale.com/wgengine/magicsock/magicsock.go:2481 +0x12c5
    2024-05-08T04:30:25.9559026Z tailscale.com/wgengine/magicsock.(*Conn).rebind(0xc0003b4808, 0x0)
    2024-05-08T04:30:25.9559874Z 	tailscale.com/wgengine/magicsock/magicsock.go:2510 +0x16f
    2024-05-08T04:30:25.9561038Z tailscale.com/wgengine/magicsock.NewConn({0xc000063c80, 0x0, 0xc000197930, 0xc000197950, 0xc000197960, {0x0, 0x0}, 0xc000197970, 0xc000198ee0, 0x0, ...})
    2024-05-08T04:30:25.9562402Z 	tailscale.com/wgengine/magicsock/magicsock.go:476 +0xd5f
    2024-05-08T04:30:25.9563779Z tailscale.com/wgengine.NewUserspaceEngine(0xc000063c80, {{0x22c8750, 0xc0001976b0}, 0x0, {0x22c3210, 0xc000063c80}, {0x22c31d8, 0x2d3c900}, 0x0, 0x0, ...})
    2024-05-08T04:30:25.9564982Z 	tailscale.com/wgengine/userspace.go:389 +0x159d
    2024-05-08T04:30:25.9565529Z tailscale.com/ipn/ipnlocal.newTestBackend(0xc000358b60)
    2024-05-08T04:30:25.9566086Z 	tailscale.com/ipn/ipnlocal/serve_test.go:675 +0x2a5
    2024-05-08T04:30:25.9566612Z ta

Updates #11874

Change-Id: I3432ed52d670743e532be4642f38dbd6e3763b1b
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-05-08 04:37:33 +00:00
+										Tun:           tunDev,
 										Dialer:        dialer,
 										SetSubsystem:  sys.Set,
 										HealthTracker: sys.HealthTracker(),
-												util/usermetrics: make usermetrics non-global

this commit changes usermetrics to be non-global, this is a building
block for correct metrics if a go process runs multiple tsnets or
in tests.

Updates #13420
Updates tailscale/corp#22075

Signed-off-by: Kristoffer Dalby <kristoffer@tailscale.com>

											
										
										
											2024-09-23 16:34:00 +00:00
+										Metrics:       sys.UserMetricsRegistry(),
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									})
 									if err != nil {
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+										tb.Fatal(err)
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									}
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+									tb.Cleanup(func() { eng.Close() })
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									sys.Set(eng)
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
-												wgengine/netstack: remove unused taildrive deps

A filesystem was plumbed into netstack in 993acf4475b22d693
but hasn't been used since 2d5d6f5403f3. Remove it.

Noticed while rebasing a Tailscale fork elsewhere.

Updates tailscale/corp#16827

Change-Id: Ib76deeda205ffe912b77a59b9d22853ebff42813
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-11-01 17:50:40 +00:00
+									ns, err := Create(logf, sys.Tun.Get(), eng, sys.MagicSock.Get(), dialer, sys.DNSManager.Get(), sys.ProxyMapper())
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									if err != nil {
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+										tb.Fatal(err)
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									}
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+									tb.Cleanup(func() { ns.Close() })
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
-												tsd: add package with System type to unify subsystem init, discovery

This is part of an effort to clean up tailscaled initialization between
tailscaled, tailscaled Windows service, tsnet, and the mac GUI.

Updates #8036

Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2023-05-03 20:57:17 +00:00
+									lb, err := ipnlocal.NewLocalBackend(logf, logid.PublicID{}, sys, 0)
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+									if err != nil {
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+										tb.Fatalf("NewLocalBackend: %v", err)
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+									}
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+									ns.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return true })
 									if config != nil {
 										config(ns)
 									}
 									if err := ns.Start(lb); err != nil {
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
+										tb.Fatalf("Start: %v", err)
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+									}
 									return ns
 								}
 								func TestShouldHandlePing(t *testing.T) {
 									srcIP := netip.AddrFrom4([4]byte{1, 2, 3, 4})
 									t.Run("ICMP4", func(t *testing.T) {
 										dst := netip.MustParseAddr("5.6.7.8")
 										icmph := packet.ICMP4Header{
 											IP4Header: packet.IP4Header{
 												IPProto: ipproto.ICMPv4,
 												Src:     srcIP,
 												Dst:     dst,
 											},
 											Type: packet.ICMP4EchoRequest,
 											Code: packet.ICMP4NoCode,
 										}
 										_, payload := packet.ICMPEchoPayload(nil)
 										icmpPing := packet.Generate(icmph, payload)
 										pkt := &packet.Parsed{}
 										pkt.Decode(icmpPing)
 										impl := makeNetstack(t, func(impl *Impl) {
 											impl.ProcessSubnets = true
 										})
 										pingDst, ok := impl.shouldHandlePing(pkt)
 										if !ok {
 											t.Errorf("expected shouldHandlePing==true")
 										}
 										if pingDst != dst {
 											t.Errorf("got dst %s; want %s", pingDst, dst)
 										}
 									})
 									t.Run("ICMP6-no-via", func(t *testing.T) {
 										dst := netip.MustParseAddr("2a09:8280:1::4169")
 										icmph := packet.ICMP6Header{
 											IP6Header: packet.IP6Header{
 												IPProto: ipproto.ICMPv6,
 												Src:     srcIP,
 												Dst:     dst,
 											},
 											Type: packet.ICMP6EchoRequest,
 											Code: packet.ICMP6NoCode,
 										}
 										_, payload := packet.ICMPEchoPayload(nil)
 										icmpPing := packet.Generate(icmph, payload)
 										pkt := &packet.Parsed{}
 										pkt.Decode(icmpPing)
 										impl := makeNetstack(t, func(impl *Impl) {
 											impl.ProcessSubnets = true
 										})
 										pingDst, ok := impl.shouldHandlePing(pkt)
 										// Expect that we handle this since it's going out onto the
 										// network.
 										if !ok {
 											t.Errorf("expected shouldHandlePing==true")
 										}
 										if pingDst != dst {
 											t.Errorf("got dst %s; want %s", pingDst, dst)
 										}
 									})
 									t.Run("ICMP6-tailscale-addr", func(t *testing.T) {
 										dst := netip.MustParseAddr("fd7a:115c:a1e0:ab12::1")
 										icmph := packet.ICMP6Header{
 											IP6Header: packet.IP6Header{
 												IPProto: ipproto.ICMPv6,
 												Src:     srcIP,
 												Dst:     dst,
 											},
 											Type: packet.ICMP6EchoRequest,
 											Code: packet.ICMP6NoCode,
 										}
 										_, payload := packet.ICMPEchoPayload(nil)
 										icmpPing := packet.Generate(icmph, payload)
 										pkt := &packet.Parsed{}
 										pkt.Decode(icmpPing)
 										impl := makeNetstack(t, func(impl *Impl) {
 											impl.ProcessSubnets = true
 										})
 										_, ok := impl.shouldHandlePing(pkt)
 										// We don't handle this because it's a Tailscale IP and not 4via6
 										if ok {
 											t.Errorf("expected shouldHandlePing==false")
 										}
 									})
-												wgengine/netstack: always respond to 4via6 echo requests (#5712)

As the comment in the code says, netstack should always respond to ICMP
echo requests to a 4via6 address, even if the netstack instance isn't
normally processing subnet traffic.

Follow-up to #5709

Change-Id: I504d0776c5824071b2a2e0e687bc33e24f6c4746
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 22:07:57 +00:00
+									// Handle pings for 4via6 addresses regardless of ProcessSubnets
 									for _, subnets := range []bool{true, false} {
 										t.Run("ICMP6-4via6-ProcessSubnets-"+fmt.Sprint(subnets), func(t *testing.T) {
 											// The 4via6 route 10.1.1.0/24 siteid 7, and then the IP
 											// 10.1.1.9 within that route.
 											dst := netip.MustParseAddr("fd7a:115c:a1e0:b1a:0:7:a01:109")
 											expectedPingDst := netip.MustParseAddr("10.1.1.9")
 											icmph := packet.ICMP6Header{
 												IP6Header: packet.IP6Header{
 													IPProto: ipproto.ICMPv6,
 													Src:     srcIP,
 													Dst:     dst,
 												},
 												Type: packet.ICMP6EchoRequest,
 												Code: packet.ICMP6NoCode,
 											}
 											_, payload := packet.ICMPEchoPayload(nil)
 											icmpPing := packet.Generate(icmph, payload)
 											pkt := &packet.Parsed{}
 											pkt.Decode(icmpPing)
 											impl := makeNetstack(t, func(impl *Impl) {
 												impl.ProcessSubnets = subnets
 											})
 											pingDst, ok := impl.shouldHandlePing(pkt)
 											// Handled due to being 4via6
 											if !ok {
 												t.Errorf("expected shouldHandlePing==true")
 											} else if pingDst != expectedPingDst {
 												t.Errorf("got dst %s; want %s", pingDst, expectedPingDst)
 											}
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+										})
-												wgengine/netstack: always respond to 4via6 echo requests (#5712)

As the comment in the code says, netstack should always respond to ICMP
echo requests to a 4via6 address, even if the netstack instance isn't
normally processing subnet traffic.

Follow-up to #5709

Change-Id: I504d0776c5824071b2a2e0e687bc33e24f6c4746
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 22:07:57 +00:00
+									}
-												wgengine/netstack: handle 4via6 packets when pinging (#5709)

Change-Id: Ib6ebbaa11219fb91b550ed7fc6ede61f83262e89
Signed-off-by: Andrew Dunham <andrew@tailscale.com>
											
										
										
											2022-09-21 18:19:34 +00:00
+								}
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
-												wgengine/netstack: optimize shouldProcessInbound, avoiding 4via6 lookups

All IPv6 packets for the self address were doing netip.Prefix.Contains
lookups.

If we know they're for a self address (which we already previously
computed and have sitting in a bool), then they can't be for a 4via6
range.

Change-Id: Iaaaf1248cb3fecec229935a80548ead0eb4cb892
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-11-09 03:53:40 +00:00
+								// looksLikeATailscaleSelfAddress reports whether addr looks like
 								// a Tailscale self address, for tests.
 								func looksLikeATailscaleSelfAddress(addr netip.Addr) bool {
 									switch {
 									case addr.Is4():
 										// IPv4: defer to tsaddr's Tailscale IP check.
 										return tsaddr.IsTailscaleIP(addr)
 									case addr.Is6():
 										// IPv6: must fall inside the range returned by
 										// tsaddr.Tailscale4To6Range.
 										return tsaddr.Tailscale4To6Range().Contains(addr)
 									default:
 										// Neither family (e.g. the zero Addr).
 										return false
 									}
 								}
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+								func TestShouldProcessInbound(t *testing.T) {
 									testCases := []struct {
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+										name        string
 										pkt         *packet.Parsed
 										afterStart  func(*Impl) // optional; after Impl.Start is called
 										beforeStart func(*Impl) // optional; before Impl.Start is called
 										want        bool
 										runOnGOOS   string
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+									}{
 										{
 											name: "ipv6-via",
 											pkt: &packet.Parsed{
 												IPVersion: 6,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												// $ tailscale debug via 7 10.1.1.9/24
 												// fd7a:115c:a1e0:b1a:0:7:a01:109/120
 												Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:109]:5678"),
 												TCPFlags: packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												prefs := ipn.NewPrefs()
 												prefs.AdvertiseRoutes = []netip.Prefix{
 													// $ tailscale debug via 7 10.1.1.0/24
 													// fd7a:115c:a1e0:b1a:0:7:a01:100/120
 													netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:100/120"),
 												}
 												i.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+													UpdatePrefs: prefs,
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												})
-												wgengine/netstack: optimize shouldProcessInbound, avoiding 4via6 lookups

All IPv6 packets for the self address were doing netip.Prefix.Contains
lookups.

If we know they're for a self address (which we already previously
computed and have sitting in a bool), then they can't be for a 4via6
range.

Change-Id: Iaaaf1248cb3fecec229935a80548ead0eb4cb892
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-11-09 03:53:40 +00:00
+												i.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											},
 											beforeStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												// This should be handled even if we're
 												// otherwise not processing local IPs or
 												// subnets.
 												i.ProcessLocalIPs = false
 												i.ProcessSubnets = false
 											},
 											want: true,
 										},
 										{
 											name: "ipv6-via-not-advertised",
 											pkt: &packet.Parsed{
 												IPVersion: 6,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												// $ tailscale debug via 7 10.1.1.9/24
 												// fd7a:115c:a1e0:b1a:0:7:a01:109/120
 												Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:109]:5678"),
 												TCPFlags: packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												prefs := ipn.NewPrefs()
 												prefs.AdvertiseRoutes = []netip.Prefix{
 													// tailscale debug via 7 10.1.2.0/24
 													// fd7a:115c:a1e0:b1a:0:7:a01:200/120
 													netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:200/120"),
 												}
 												i.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+													UpdatePrefs: prefs,
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												})
 											},
 											want: false,
 										},
 										{
 											name: "tailscale-ssh-enabled",
 											pkt: &packet.Parsed{
 												IPVersion: 4,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												Dst:       netip.MustParseAddrPort("100.101.102.104:22"),
 												TCPFlags:  packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												prefs := ipn.NewPrefs()
 												prefs.RunSSH = true
 												i.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+													UpdatePrefs: prefs,
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												})
 												i.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
 													return addr.String() == "100.101.102.104" // Dst, above
 												})
 											},
-												ipn/ipnlocal: call checkPrefs in Start too

We were not calling checkPrefs on `opts.*Prefs` in (*LocalBackend).Start().

Updates #713

Signed-off-by: Maisem Ali <maisem@tailscale.com>

											
										
										
											2022-11-21 23:11:44 +00:00
+											want:      true,
 											runOnGOOS: "linux",
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+										},
 										{
 											name: "tailscale-ssh-disabled",
 											pkt: &packet.Parsed{
 												IPVersion: 4,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												Dst:       netip.MustParseAddrPort("100.101.102.104:22"),
 												TCPFlags:  packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												prefs := ipn.NewPrefs()
 												prefs.RunSSH = false // default, but to be explicit
 												i.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+													UpdatePrefs: prefs,
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												})
 												i.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
 													return addr.String() == "100.101.102.104" // Dst, above
 												})
 											},
 											want: false,
 										},
 										{
 											name: "process-local-ips",
 											pkt: &packet.Parsed{
 												IPVersion: 4,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												Dst:       netip.MustParseAddrPort("100.101.102.104:4567"),
 												TCPFlags:  packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												i.ProcessLocalIPs = true
 												i.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
 													return addr.String() == "100.101.102.104" // Dst, above
 												})
 											},
 											want: true,
 										},
 										{
 											name: "process-subnets",
 											pkt: &packet.Parsed{
 												IPVersion: 4,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												Dst:       netip.MustParseAddrPort("10.1.2.3:4567"),
 												TCPFlags:  packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											beforeStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												i.ProcessSubnets = true
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											},
 											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												// For testing purposes, assume all Tailscale
 												// IPs are local; the Dst above is something
 												// not in that range.
-												wgengine/netstack: optimize shouldProcessInbound, avoiding 4via6 lookups

All IPv6 packets for the self address were doing netip.Prefix.Contains
lookups.

If we know they're for a self address (which we already previously
computed and have sitting in a bool), then they can't be for a 4via6
range.

Change-Id: Iaaaf1248cb3fecec229935a80548ead0eb4cb892
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-11-09 03:53:40 +00:00
+												i.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+											},
 											want: true,
 										},
 										{
 											name: "peerapi-port-subnet-router", // see #6235
 											pkt: &packet.Parsed{
 												IPVersion: 4,
 												IPProto:   ipproto.TCP,
 												Src:       netip.MustParseAddrPort("100.101.102.103:1234"),
 												Dst:       netip.MustParseAddrPort("10.0.0.23:5555"),
 												TCPFlags:  packet.TCPSyn,
 											},
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											beforeStart: func(i *Impl) {
 												// As if we were running on Linux where netstack isn't used.
 												i.ProcessSubnets = false
 												i.atomicIsLocalIPFunc.Store(func(netip.Addr) bool { return false })
 											},
 											afterStart: func(i *Impl) {
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												prefs := ipn.NewPrefs()
 												prefs.AdvertiseRoutes = []netip.Prefix{
 													netip.MustParsePrefix("10.0.0.1/24"),
 												}
 												i.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+													UpdatePrefs: prefs,
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+												})
 												// Set the PeerAPI port to the Dst port above.
-												wgengine/netstack: delete some dead code, old comment, use atomic int types

Noticed while looking at something else; #cleanup.

Change-Id: Icde7749363014eab9bebe1dd80708f5491f933d1
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-22 20:53:56 +00:00
+												i.peerapiPort4Atomic.Store(5555)
 												i.peerapiPort6Atomic.Store(5555)
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
+											},
 											want: false,
 										},
 										// TODO(andrew): test PeerAPI
 										// TODO(andrew): test TCP packets without the SYN flag set
 									}
 									for _, tc := range testCases {
 										t.Run(tc.name, func(t *testing.T) {
-												ipn/ipnlocal: call checkPrefs in Start too

We were not calling checkPrefs on `opts.*Prefs` in (*LocalBackend).Start().

Updates #713

Signed-off-by: Maisem Ali <maisem@tailscale.com>

											
										
										
											2022-11-21 23:11:44 +00:00
+											if tc.runOnGOOS != "" && runtime.GOOS != tc.runOnGOOS {
 												t.Skipf("skipping on GOOS=%v", runtime.GOOS)
 											}
-												wgengine/netstack: change netstack API to require LocalBackend

The macOS client was forgetting to call netstack.Impl.SetLocalBackend.
Change the API so that it can't be started without one, eliminating this
class of bug. Then update all the callers.

Updates #6764

Change-Id: I2b3a4f31fdfd9fdbbbbfe25a42db0c505373562f
Signed-off-by: Claire Wang <claire@tailscale.com>
Co-authored-by: Brad Fitzpatrick <bradfitz@tailscale.com>
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2022-12-23 18:22:39 +00:00
+											impl := makeNetstack(t, tc.beforeStart)
 											if tc.afterStart != nil {
 												tc.afterStart(impl)
 											}
-												wgengine/netstack: add tests for shouldProcessInbound

Inspired by #6235, let's explicitly test the behaviour of this function
to ensure that we're not processing things we don't expect to.

Change-Id: I158050a63be7410fb99452089ea607aaf89fe91a
Signed-off-by: Andrew Dunham <andrew@tailscale.com>

											
										
										
											2022-11-08 21:09:23 +00:00
 											got := impl.shouldProcessInbound(tc.pkt, nil)
 											if got != tc.want {
 												t.Errorf("got shouldProcessInbound()=%v; want %v", got, tc.want)
 											} else {
 												t.Logf("OK: shouldProcessInbound() = %v", got)
 											}
 										})
 									}
 								}
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
 								func tcp4syn(tb testing.TB, src, dst netip.Addr, sport, dport uint16) []byte {
 									ip := header.IPv4(make([]byte, header.IPv4MinimumSize+header.TCPMinimumSize))
 									ip.Encode(&header.IPv4Fields{
 										Protocol:    uint8(header.TCPProtocolNumber),
 										TotalLength: header.IPv4MinimumSize + header.TCPMinimumSize,
 										TTL:         64,
 										SrcAddr:     tcpip.AddrFrom4Slice(src.AsSlice()),
 										DstAddr:     tcpip.AddrFrom4Slice(dst.AsSlice()),
 									})
 									ip.SetChecksum(^ip.CalculateChecksum())
 									if !ip.IsChecksumValid() {
 										tb.Fatal("test broken; packet has incorrect IP checksum")
 									}
 									tcp := header.TCP(ip[header.IPv4MinimumSize:])
 									tcp.Encode(&header.TCPFields{
 										SrcPort:    sport,
 										DstPort:    dport,
 										SeqNum:     0,
 										DataOffset: header.TCPMinimumSize,
 										Flags:      header.TCPFlagSyn,
 										WindowSize: 65535,
 										Checksum:   0,
 									})
 									xsum := header.PseudoHeaderChecksum(
 										header.TCPProtocolNumber,
 										tcpip.AddrFrom4Slice(src.AsSlice()),
 										tcpip.AddrFrom4Slice(dst.AsSlice()),
 										uint16(header.TCPMinimumSize),
 									)
 									tcp.SetChecksum(^tcp.CalculateChecksum(xsum))
 									if !tcp.IsChecksumValid(tcpip.AddrFrom4Slice(src.AsSlice()), tcpip.AddrFrom4Slice(dst.AsSlice()), 0, 0) {
 										tb.Fatal("test broken; packet has incorrect TCP checksum")
 									}
 									return ip
 								}
 								// makeHangDialer builds a dial function for tests that never yields a
 								// connection, along with a channel that reports when a dial has started.
 								//
 								// Each call to the returned function logs its arguments, makes a
 								// non-blocking send on the returned channel (capacity one, so at most one
 								// notification is queued), and then blocks until either its context is
 								// done or the cleanup registered on tb has run. It always returns a nil
 								// net.Conn and the error "canceled".
 								func makeHangDialer(tb testing.TB) (func(context.Context, string, string) (net.Conn, error), chan struct{}) {
 									// Buffered so the first dial can signal without a receiver waiting.
 									dialStarted := make(chan struct{}, 1)

 									// testOver is closed from tb's cleanup to release any dial still blocked.
 									testOver := make(chan struct{})
 									tb.Cleanup(func() { close(testOver) })

 									hang := func(ctx context.Context, network, address string) (net.Conn, error) {
 										tb.Logf("hangDialer: called with network=%q address=%q", network, address)

 										// Announce the dial, dropping the notification if one is
 										// already pending.
 										select {
 										case dialStarted <- struct{}{}:
 										default:
 										}

 										// Park here until the caller gives up or the test ends.
 										select {
 										case <-testOver:
 											tb.Logf("function completed")
 										case <-ctx.Done():
 											tb.Logf("context done")
 										}
 										return nil, fmt.Errorf("canceled")
 									}
 									return hang, dialStarted
 								}
 								// TestTCPForwardLimits verifies that the limits on the TCP forwarder work in a
 								// success case (i.e. when we don't hit the limit).
 								func TestTCPForwardLimits(t *testing.T) {
 									envknob.Setenv("TS_DEBUG_NETSTACK", "true")
 									impl := makeNetstack(t, func(impl *Impl) {
 										impl.ProcessSubnets = true
 									})
 									dialFn, gotConn := makeHangDialer(t)
 									impl.forwardDialFunc = dialFn
 									prefs := ipn.NewPrefs()
 									prefs.AdvertiseRoutes = []netip.Prefix{
 										// This is the TEST-NET-1 IP block for use in documentation,
 										// and should never actually be routable.
 										netip.MustParsePrefix("192.0.2.0/24"),
 									}
 									impl.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+										UpdatePrefs: prefs,
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									})
 									impl.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
 									// Inject an "outbound" packet that's going to an IP address that times
 									// out. We need to re-parse from a byte slice so that the internal
 									// buffer in the packet.Parsed type is filled out.
 									client := netip.MustParseAddr("100.101.102.103")
 									destAddr := netip.MustParseAddr("192.0.2.1")
 									pkt := tcp4syn(t, client, destAddr, 1234, 4567)
 									var parsed packet.Parsed
 									parsed.Decode(pkt)
 									// When injecting this packet, we want the outcome to be "drop
 									// silently", which indicates that netstack is processing the
 									// packet and not delivering it to the host system.
-												net/tstun,wgengine{/netstack/gro}: refactor and re-enable gVisor GRO for Linux (#13172)

In 2f27319baf71681e221904d3a3ffe1badedc8e2e we disabled GRO due to a
data race around concurrent calls to tstun.Wrapper.Write(). This commit
refactors GRO to be thread-safe, and re-enables it on Linux.

This refactor now carries a GRO type across tstun and netstack APIs
with a lifetime that is scoped to a single tstun.Wrapper.Write() call.

In 25f0a3fc8f6f9cf681bb5afda8e1762816c67a8b we used build tags to
prevent importation of gVisor's GRO package on iOS as at the time we
believed it was contributing to additional memory usage on that
platform. It wasn't, so this commit simplifies and removes those
build tags.

Updates tailscale/corp#22353
Updates tailscale/corp#22125
Updates #6816

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-20 22:22:19 +00:00
+									if resp, _ := impl.injectInbound(&parsed, impl.tundev, nil); resp != filter.DropSilently {
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+										t.Errorf("got filter outcome %v, want filter.DropSilently", resp)
 									}
 									ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
 									defer cancel()
 									// Wait until we have an in-flight outgoing connection.
 									select {
 									case <-ctx.Done():
 										t.Fatalf("timed out waiting for connection")
 									case <-gotConn:
 										t.Logf("got connection in progress")
 									}
-												wgengine/netstack: fix bug with duplicate SYN packets in client limit

This fixes a bug that was introduced in #11258 where the handling of the
per-client limit didn't properly account for the fact that the gVisor
TCP forwarder will return 'true' to indicate that it's handled a
duplicate SYN packet, but not launch the handler goroutine.

In such a case, we neither decremented our per-client limit in the
wrapper function, nor did we do so in the handler function, leading to
our per-client limit table slowly filling up without bound.

Fix this by doing the same duplicate-tracking logic that the TCP
forwarder does so we can detect such cases and appropriately decrement
our in-flight counter.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ib6011a71d382a10d68c0802593f34b8153d06892

											
										
										
											2024-02-29 04:21:31 +00:00
+									// Inject another packet, which will be deduplicated and thus not
 									// increment our counter.
 									parsed.Decode(pkt)
-												net/tstun,wgengine{/netstack/gro}: refactor and re-enable gVisor GRO for Linux (#13172)

In 2f27319baf71681e221904d3a3ffe1badedc8e2e we disabled GRO due to a
data race around concurrent calls to tstun.Wrapper.Write(). This commit
refactors GRO to be thread-safe, and re-enables it on Linux.

This refactor now carries a GRO type across tstun and netstack APIs
with a lifetime that is scoped to a single tstun.Wrapper.Write() call.

In 25f0a3fc8f6f9cf681bb5afda8e1762816c67a8b we used build tags to
prevent importation of gVisor's GRO package on iOS as at the time we
believed it was contributing to additional memory usage on that
platform. It wasn't, so this commit simplifies and removes those
build tags.

Updates tailscale/corp#22353
Updates tailscale/corp#22125
Updates #6816

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-20 22:22:19 +00:00
+									if resp, _ := impl.injectInbound(&parsed, impl.tundev, nil); resp != filter.DropSilently {
-												wgengine/netstack: fix bug with duplicate SYN packets in client limit

This fixes a bug that was introduced in #11258 where the handling of the
per-client limit didn't properly account for the fact that the gVisor
TCP forwarder will return 'true' to indicate that it's handled a
duplicate SYN packet, but not launch the handler goroutine.

In such a case, we neither decremented our per-client limit in the
wrapper function, nor did we do so in the handler function, leading to
our per-client limit table slowly filling up without bound.

Fix this by doing the same duplicate-tracking logic that the TCP
forwarder does so we can detect such cases and appropriately decrement
our in-flight counter.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ib6011a71d382a10d68c0802593f34b8153d06892

											
										
										
											2024-02-29 04:21:31 +00:00
+										t.Errorf("got filter outcome %v, want filter.DropSilently", resp)
 									}
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									// Verify that we now have a single in-flight address in our map.
 									impl.mu.Lock()
 									inFlight := maps.Clone(impl.connsInFlightByClient)
 									impl.mu.Unlock()
 									if got, ok := inFlight[client]; !ok || got != 1 {
 										t.Errorf("expected 1 in-flight connection for %v, got: %v", client, inFlight)
 									}
 									// Get the expvar statistics and verify that we're exporting the
 									// correct metric.
 									metrics := impl.ExpVar().(*metrics.Set)
 									const metricName = "gauge_tcp_forward_in_flight"
 									if v := metrics.Get(metricName).String(); v != "1" {
 										t.Errorf("got metric %q=%s, want 1", metricName, v)
 									}
 								}
 								// TestTCPForwardLimits_PerClient verifies that the per-client limit for TCP
 								// forwarding works.
 								func TestTCPForwardLimits_PerClient(t *testing.T) {
 									envknob.Setenv("TS_DEBUG_NETSTACK", "true")
 									// Set our test override limits during this test.
 									tstest.Replace(t, &maxInFlightConnectionAttemptsForTest, 2)
 									tstest.Replace(t, &maxInFlightConnectionAttemptsPerClientForTest, 1)
 									impl := makeNetstack(t, func(impl *Impl) {
 										impl.ProcessSubnets = true
 									})
 									dialFn, gotConn := makeHangDialer(t)
 									impl.forwardDialFunc = dialFn
 									prefs := ipn.NewPrefs()
 									prefs.AdvertiseRoutes = []netip.Prefix{
 										// This is the TEST-NET-1 IP block for use in documentation,
 										// and should never actually be routable.
 										netip.MustParsePrefix("192.0.2.0/24"),
 									}
 									impl.lb.Start(ipn.Options{
-												ipn: remove unused Options.LegacyMigrationPrefs

I'm on a mission to simplify LocalBackend.Start and its locking
and deflake some tests.

I noticed this hasn't been used since March 2023 when it was removed
from the Windows client in corp 66be796d33c.

So, delete.

Updates #11649

Change-Id: I40f2cb75fb3f43baf23558007655f65a8ec5e1b2
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>

											
										
										
											2024-04-16 04:40:21 +00:00
+										UpdatePrefs: prefs,
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									})
 									impl.atomicIsLocalIPFunc.Store(looksLikeATailscaleSelfAddress)
 									// Inject an "outbound" packet that's going to an IP address that times
 									// out. We need to re-parse from a byte slice so that the internal
 									// buffer in the packet.Parsed type is filled out.
 									client := netip.MustParseAddr("100.101.102.103")
 									destAddr := netip.MustParseAddr("192.0.2.1")
 									// Helpers
-												wgengine/netstack: fix bug with duplicate SYN packets in client limit

This fixes a bug that was introduced in #11258 where the handling of the
per-client limit didn't properly account for the fact that the gVisor
TCP forwarder will return 'true' to indicate that it's handled a
duplicate SYN packet, but not launch the handler goroutine.

In such a case, we neither decremented our per-client limit in the
wrapper function, nor did we do so in the handler function, leading to
our per-client limit table slowly filling up without bound.

Fix this by doing the same duplicate-tracking logic that the TCP
forwarder does so we can detect such cases and appropriately decrement
our in-flight counter.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ib6011a71d382a10d68c0802593f34b8153d06892

											
										
										
											2024-02-29 04:21:31 +00:00
+									var port uint16 = 1234
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+									mustInjectPacket := func() {
-												wgengine/netstack: fix bug with duplicate SYN packets in client limit

This fixes a bug that was introduced in #11258 where the handling of the
per-client limit didn't properly account for the fact that the gVisor
TCP forwarder will return 'true' to indicate that it's handled a
duplicate SYN packet, but not launch the handler goroutine.

In such a case, we neither decremented our per-client limit in the
wrapper function, nor did we do so in the handler function, leading to
our per-client limit table slowly filling up without bound.

Fix this by doing the same duplicate-tracking logic that the TCP
forwarder does so we can detect such cases and appropriately decrement
our in-flight counter.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ib6011a71d382a10d68c0802593f34b8153d06892

											
										
										
											2024-02-29 04:21:31 +00:00
+										pkt := tcp4syn(t, client, destAddr, port, 4567)
 										port++ // to avoid deduplication based on endpoint
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+										var parsed packet.Parsed
 										parsed.Decode(pkt)
 										// When injecting this packet, we want the outcome to be "drop
 										// silently", which indicates that netstack is processing the
 										// packet and not delivering it to the host system.
-												net/tstun,wgengine{/netstack/gro}: refactor and re-enable gVisor GRO for Linux (#13172)

In 2f27319baf71681e221904d3a3ffe1badedc8e2e we disabled GRO due to a
data race around concurrent calls to tstun.Wrapper.Write(). This commit
refactors GRO to be thread-safe, and re-enables it on Linux.

This refactor now carries a GRO type across tstun and netstack APIs
with a lifetime that is scoped to a single tstun.Wrapper.Write() call.

In 25f0a3fc8f6f9cf681bb5afda8e1762816c67a8b we used build tags to
prevent importation of gVisor's GRO package on iOS as at the time we
believed it was contributing to additional memory usage on that
platform. It wasn't, so this commit simplifies and removes those
build tags.

Updates tailscale/corp#22353
Updates tailscale/corp#22125
Updates #6816

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-20 22:22:19 +00:00
+										if resp, _ := impl.injectInbound(&parsed, impl.tundev, nil); resp != filter.DropSilently {
-												wgengine/netstack: add a per-client limit for in-flight TCP forwards

This is a fun one. Right now, when a client is connecting through a
subnet router, here's roughly what happens:

1. The client initiates a connection to an IP address behind a subnet
   router, and sends a TCP SYN
2. The subnet router gets the SYN packet from netstack, and after
   running through acceptTCP, starts DialContext-ing the destination IP,
   without accepting the connection¹
3. The client retransmits the SYN packet a few times while the dial is
   in progress, until either...
4. The subnet router successfully establishes a connection to the
   destination IP and sends the SYN-ACK back to the client, or...
5. The subnet router times out and sends a RST to the client.
6. If the connection was successful, the client ACKs the SYN-ACK it
   received, and traffic starts flowing

As a result, the notification code in forwardTCP never notices when a
new connection attempt is aborted, and it will wait until either the
connection is established, or until the OS-level connection timeout is
reached and it aborts.

To mitigate this, add a per-client limit on how many in-flight TCP
forwarding connections can be in-progress; after this, clients will see
a similar behaviour to the global limit, where new connection attempts
are aborted instead of waiting. This prevents a single misbehaving
client from blocking all other clients of a subnet router by ensuring
that it doesn't starve the global limiter.

Also, bump the global limit again to a higher value.

¹ We can't accept the connection before establishing a connection to the
remote server since otherwise we'd be opening the connection and then
immediately closing it, which breaks a bunch of stuff; see #5503 for
more details.

Updates tailscale/corp#12184

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: I76e7008ddd497303d75d473f534e32309c8a5144

											
										
										
											2024-02-26 20:06:47 +00:00
+											t.Fatalf("got filter outcome %v, want filter.DropSilently", resp)
 										}
 									}
 									ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
 									defer cancel()
 									waitPacket := func() {
 										select {
 										case <-ctx.Done():
 											t.Fatalf("timed out waiting for connection")
 										case <-gotConn:
 											t.Logf("got connection in progress")
 										}
 									}
 									// Inject the packet to start the TCP forward and wait until we have an
 									// in-flight outgoing connection.
 									mustInjectPacket()
 									waitPacket()
 									// Verify that we now have a single in-flight address in our map.
 									impl.mu.Lock()
 									inFlight := maps.Clone(impl.connsInFlightByClient)
 									impl.mu.Unlock()
 									if got, ok := inFlight[client]; !ok || got != 1 {
 										t.Errorf("expected 1 in-flight connection for %v, got: %v", client, inFlight)
 									}
 									metrics := impl.ExpVar().(*metrics.Set)
 									// One client should have reached the limit at this point.
 									if v := metrics.Get("gauge_tcp_forward_in_flight_per_client_limit_reached").String(); v != "1" {
 										t.Errorf("got limit reached expvar metric=%s, want 1", v)
 									}
 									// Inject another packet, and verify that we've incremented our
 									// "dropped" metrics since this will have been dropped.
 									mustInjectPacket()
 									// expvar metric
 									const metricName = "counter_tcp_forward_max_in_flight_per_client_drop"
 									if v := metrics.Get(metricName).String(); v != "1" {
 										t.Errorf("got expvar metric %q=%s, want 1", metricName, v)
 									}
 									// client metric
 									if v := metricPerClientForwardLimit.Value(); v != 1 {
 										t.Errorf("got clientmetric limit metric=%d, want 1", v)
 									}
 								}
-												wgengine/netstack: handle 4via6 routes that are advertised by the same node

Previously, a node that was advertising a 4via6 route wouldn't be able
to make use of that same route; the packet would be delivered to
Tailscale, but since we weren't accepting it in handleLocalPackets, the
packet wouldn't be delivered to netstack and would never hit the 4via6
logic. Let's add that support so that usage of 4via6 is consistent
regardless of where the connection is initiated from.

Updates #11304

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ic28dc2e58080d76100d73b93360f4698605af7cb

											
										
										
											2024-05-05 22:00:19 +00:00
 								// TestHandleLocalPackets tests the handleLocalPackets function, ensuring that
 								// we are properly deciding to handle packets that are destined for "local"
 								// IPs–addresses that are either for this node, or that it is responsible for.
 								//
 								// See, e.g. #11304
 								func TestHandleLocalPackets(t *testing.T) {
 									var (
 										selfIP4 = netip.MustParseAddr("100.64.1.2")
 										selfIP6 = netip.MustParseAddr("fd7a:115c:a1e0::123")
 									)
 									impl := makeNetstack(t, func(impl *Impl) {
 										impl.ProcessSubnets = false
 										impl.ProcessLocalIPs = false
 										impl.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
 											return addr == selfIP4 || addr == selfIP6
 										})
 									})
 									prefs := ipn.NewPrefs()
 									prefs.AdvertiseRoutes = []netip.Prefix{
 										// $ tailscale debug via 7 10.1.1.0/24
 										// fd7a:115c:a1e0:b1a:0:7:a01:100/120
 										netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:100/120"),
 									}
 									_, err := impl.lb.EditPrefs(&ipn.MaskedPrefs{
 										Prefs:              *prefs,
 										AdvertiseRoutesSet: true,
 									})
 									if err != nil {
 										t.Fatalf("EditPrefs: %v", err)
 									}
 									t.Run("ShouldHandleServiceIP", func(t *testing.T) {
 										pkt := &packet.Parsed{
 											IPVersion: 4,
 											IPProto:   ipproto.TCP,
 											Src:       netip.MustParseAddrPort("127.0.0.1:9999"),
 											Dst:       netip.MustParseAddrPort("100.100.100.100:53"),
 											TCPFlags:  packet.TCPSyn,
 										}
-												net/tstun,wgengine/netstack: implement TCP GRO for local services (#13315)

Throughput improves substantially when measured via netstack loopback
(TS_DEBUG_NETSTACK_LOOPBACK_PORT).

Before (d21ebc2):
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  5.77 GBytes  4.95 Gbits/sec    0 sender
[  5]   0.00-10.01  sec  5.77 GBytes  4.95 Gbits/sec      receiver

After:
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec    0 sender
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec      receiver

Updates tailscale/corp#22754

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-29 18:37:48 +00:00
+										resp, _ := impl.handleLocalPackets(pkt, impl.tundev, nil)
-												wgengine/netstack: handle 4via6 routes that are advertised by the same node

Previously, a node that was advertising a 4via6 route wouldn't be able
to make use of that same route; the packet would be delivered to
Tailscale, but since we weren't accepting it in handleLocalPackets, the
packet wouldn't be delivered to netstack and would never hit the 4via6
logic. Let's add that support so that usage of 4via6 is consistent
regardless of where the connection is initiated from.

Updates #11304

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ic28dc2e58080d76100d73b93360f4698605af7cb

											
										
										
											2024-05-05 22:00:19 +00:00
+										if resp != filter.DropSilently {
 											t.Errorf("got filter outcome %v, want filter.DropSilently", resp)
 										}
 									})
 									t.Run("ShouldHandle4via6", func(t *testing.T) {
 										pkt := &packet.Parsed{
 											IPVersion: 6,
 											IPProto:   ipproto.TCP,
 											Src:       netip.MustParseAddrPort("[::1]:1234"),
 											// This is an IP in the above 4via6 subnet that this node handles.
 											//    $ tailscale debug via 7 10.1.1.9/24
 											//    fd7a:115c:a1e0:b1a:0:7:a01:109/120
 											Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:109]:5678"),
 											TCPFlags: packet.TCPSyn,
 										}
-												net/tstun,wgengine/netstack: implement TCP GRO for local services (#13315)

Throughput improves substantially when measured via netstack loopback
(TS_DEBUG_NETSTACK_LOOPBACK_PORT).

Before (d21ebc2):
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  5.77 GBytes  4.95 Gbits/sec    0 sender
[  5]   0.00-10.01  sec  5.77 GBytes  4.95 Gbits/sec      receiver

After:
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec    0 sender
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec      receiver

Updates tailscale/corp#22754

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-29 18:37:48 +00:00
+										resp, _ := impl.handleLocalPackets(pkt, impl.tundev, nil)
-												wgengine/netstack: handle 4via6 routes that are advertised by the same node

Previously, a node that was advertising a 4via6 route wouldn't be able
to make use of that same route; the packet would be delivered to
Tailscale, but since we weren't accepting it in handleLocalPackets, the
packet wouldn't be delivered to netstack and would never hit the 4via6
logic. Let's add that support so that usage of 4via6 is consistent
regardless of where the connection is initiated from.

Updates #11304

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ic28dc2e58080d76100d73b93360f4698605af7cb

											
										
										
											2024-05-05 22:00:19 +00:00
 										// DropSilently is the outcome we expected, since we actually
 										// handled this packet by injecting it into netstack, which
 										// will handle creating the TCP forwarder. We drop it so we
 										// don't process the packet outside of netstack.
 										if resp != filter.DropSilently {
 											t.Errorf("got filter outcome %v, want filter.DropSilently", resp)
 										}
 									})
 									t.Run("OtherNonHandled", func(t *testing.T) {
 										pkt := &packet.Parsed{
 											IPVersion: 6,
 											IPProto:   ipproto.TCP,
 											Src:       netip.MustParseAddrPort("[::1]:1234"),
 											// This IP is *not* in the above 4via6 route
 											//    $ tailscale debug via 99 10.1.1.9/24
 											//    fd7a:115c:a1e0:b1a:0:63:a01:109/120
 											Dst:      netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:63:a01:109]:5678"),
 											TCPFlags: packet.TCPSyn,
 										}
-												net/tstun,wgengine/netstack: implement TCP GRO for local services (#13315)

Throughput improves substantially when measured via netstack loopback
(TS_DEBUG_NETSTACK_LOOPBACK_PORT).

Before (d21ebc2):
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  5.77 GBytes  4.95 Gbits/sec    0 sender
[  5]   0.00-10.01  sec  5.77 GBytes  4.95 Gbits/sec      receiver

After:
jwhited@i5-12400-2:~$ iperf3 -V -c 100.100.100.100
Starting Test: protocol: TCP, 1 streams, 131072 byte blocks
Test Complete. Summary Results:
[ ID] Interval           Transfer     Bitrate         Retr
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec    0 sender
[  5]   0.00-10.00  sec  12.7 GBytes  10.9 Gbits/sec      receiver

Updates tailscale/corp#22754

Signed-off-by: Jordan Whited <jordan@tailscale.com>
											
										
										
											2024-08-29 18:37:48 +00:00
+										resp, _ := impl.handleLocalPackets(pkt, impl.tundev, nil)
-												wgengine/netstack: handle 4via6 routes that are advertised by the same node

Previously, a node that was advertising a 4via6 route wouldn't be able
to make use of that same route; the packet would be delivered to
Tailscale, but since we weren't accepting it in handleLocalPackets, the
packet wouldn't be delivered to netstack and would never hit the 4via6
logic. Let's add that support so that usage of 4via6 is consistent
regardless of where the connection is initiated from.

Updates #11304

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ic28dc2e58080d76100d73b93360f4698605af7cb

											
										
										
											2024-05-05 22:00:19 +00:00
 										// Accept means that handleLocalPackets does not handle this
 										// packet, we "accept" it to continue further processing,
 										// instead of dropping because it was already handled.
 										if resp != filter.Accept {
 											t.Errorf("got filter outcome %v, want filter.Accept", resp)
 										}
 									})
 								}
-												wgengine/netstack: add test for #12448

This refactors the logic for determining whether a packet should be sent
to the host or not into a function, and then adds tests for it.

Updates #11304
Updates #12448

Signed-off-by: Andrew Dunham <andrew@du.nham.ca>
Change-Id: Ief9afa98eaffae00e21ceb7db073c61b170355e5

											
										
										
											2024-06-13 17:48:45 +00:00
 								func TestShouldSendToHost(t *testing.T) {
 									var (
 										selfIP4 = netip.MustParseAddr("100.64.1.2")
 										selfIP6 = netip.MustParseAddr("fd7a:115c:a1e0::123")
 									)
 									makeTestNetstack := func(tb testing.TB) *Impl {
 										impl := makeNetstack(tb, func(impl *Impl) {
 											impl.ProcessSubnets = false
 											impl.ProcessLocalIPs = false
 											impl.atomicIsLocalIPFunc.Store(func(addr netip.Addr) bool {
 												return addr == selfIP4 || addr == selfIP6
 											})
 										})
 										prefs := ipn.NewPrefs()
 										prefs.AdvertiseRoutes = []netip.Prefix{
 											// $ tailscale debug via 7 10.1.1.0/24
 											// fd7a:115c:a1e0:b1a:0:7:a01:100/120
 											netip.MustParsePrefix("fd7a:115c:a1e0:b1a:0:7:a01:100/120"),
 										}
 										_, err := impl.lb.EditPrefs(&ipn.MaskedPrefs{
 											Prefs:              *prefs,
 											AdvertiseRoutesSet: true,
 										})
 										if err != nil {
 											tb.Fatalf("EditPrefs: %v", err)
 										}
 										return impl
 									}
 									testCases := []struct {
 										name     string
 										src, dst netip.AddrPort
 										want     bool
 									}{
 										// Reply from service IP to localhost should be sent to host,
 										// not over WireGuard.
 										{
 											name: "from_service_ip_to_localhost",
 											src:  netip.AddrPortFrom(serviceIP, 53),
 											dst:  netip.MustParseAddrPort("127.0.0.1:9999"),
 											want: true,
 										},
 										{
 											name: "from_service_ip_to_localhost_v6",
 											src:  netip.AddrPortFrom(serviceIPv6, 53),
 											dst:  netip.MustParseAddrPort("[::1]:9999"),
 											want: true,
 										},
 										// A reply from the local IP to a remote host isn't sent to the
 										// host, but rather over WireGuard.
 										{
 											name: "local_ip_to_remote",
 											src:  netip.AddrPortFrom(selfIP4, 12345),
 											dst:  netip.MustParseAddrPort("100.64.99.88:7777"),
 											want: false,
 										},
 										{
 											name: "local_ip_to_remote_v6",
 											src:  netip.AddrPortFrom(selfIP6, 12345),
 											dst:  netip.MustParseAddrPort("[fd7a:115:a1e0::99]:7777"),
 											want: false,
 										},
 										// A reply from a 4via6 address to a remote host isn't sent to
 										// the local host, but rather over WireGuard. See:
 										//     https://github.com/tailscale/tailscale/issues/12448
 										{
 											name: "4via6_to_remote",
 											// $ tailscale debug via 7 10.1.1.99/24
 											// fd7a:115c:a1e0:b1a:0:7:a01:163/120
 											src:  netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:163]:12345"),
 											dst:  netip.MustParseAddrPort("[fd7a:115:a1e0::99]:7777"),
 											want: false,
 										},
 										// However, a reply from a 4via6 address to the local Tailscale
 										// IP for this host *is* sent to the local host. See:
 										//     https://github.com/tailscale/tailscale/issues/11304
 										{
 											name: "4via6_to_local",
 											// $ tailscale debug via 7 10.1.1.99/24
 											// fd7a:115c:a1e0:b1a:0:7:a01:163/120
 											src:  netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:7:a01:163]:12345"),
 											dst:  netip.AddrPortFrom(selfIP6, 7777),
 											want: true,
 										},
 										// Traffic from a 4via6 address that we're not handling to
 										// either the local Tailscale IP or a remote host is sent
 										// outbound.
 										//
 										// In most cases, we won't see this type of traffic in the
 										// shouldSendToHost function, but let's confirm.
 										{
 											name: "other_4via6_to_local",
 											// $ tailscale debug via 4444 10.1.1.88/24
 											// fd7a:115c:a1e0:b1a:0:115c:a01:158/120
 											src:  netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:115c:a01:158]:12345"),
 											dst:  netip.AddrPortFrom(selfIP6, 7777),
 											want: false,
 										},
 										{
 											name: "other_4via6_to_remote",
 											// $ tailscale debug via 4444 10.1.1.88/24
 											// fd7a:115c:a1e0:b1a:0:115c:a01:158/120
 											src:  netip.MustParseAddrPort("[fd7a:115c:a1e0:b1a:0:115c:a01:158]:12345"),
 											dst:  netip.MustParseAddrPort("[fd7a:115:a1e0::99]:7777"),
 											want: false,
 										},
 									}
 									for _, tt := range testCases {
 										t.Run(tt.name, func(t *testing.T) {
 											var pkt *stack.PacketBuffer
 											if tt.src.Addr().Is4() {
 												pkt = makeUDP4PacketBuffer(tt.src, tt.dst)
 											} else {
 												pkt = makeUDP6PacketBuffer(tt.src, tt.dst)
 											}
 											ns := makeTestNetstack(t)
 											if got := ns.shouldSendToHost(pkt); got != tt.want {
 												t.Errorf("shouldSendToHost returned %v, want %v", got, tt.want)
 											}
 										})
 									}
 								}
 								// makeUDP4PacketBuffer returns a packet buffer holding a UDP-over-IPv4 packet
 								// from src to dst with a small fixed payload, for use as test input. It panics
 								// if either address is not IPv4.
 								//
 								// The UDP checksum field is left at zero. The IPv4 total length, TTL and
 								// header checksum are filled in so that the packet is well formed.
 								func makeUDP4PacketBuffer(src, dst netip.AddrPort) *stack.PacketBuffer {
 									if !src.Addr().Is4() || !dst.Addr().Is4() {
 										panic("src and dst must be IPv4")
 									}
 									data := []byte("hello world\n")
 									packetLen := header.IPv4MinimumSize + header.UDPMinimumSize
 									pkt := stack.NewPacketBuffer(stack.PacketBufferOptions{
 										ReserveHeaderBytes: packetLen,
 										Payload:            buffer.MakeWithData(data),
 									})
 									// Initialize the UDP header. It is pushed before the IP header, so
 									// pkt.Size() here is the UDP header plus the payload, i.e. the value
 									// the UDP length field must carry.
 									udp := header.UDP(pkt.TransportHeader().Push(header.UDPMinimumSize))
 									pkt.TransportProtocolNumber = header.UDPProtocolNumber
 									length := uint16(pkt.Size())
 									udp.Encode(&header.UDPFields{
 										SrcPort: src.Port(),
 										DstPort: dst.Port(),
 										Length:  length,
 									})
 									// Add IP header. TotalLength covers both headers and the payload,
 									// not just the headers.
 									ipHdr := header.IPv4(pkt.NetworkHeader().Push(header.IPv4MinimumSize))
 									pkt.NetworkProtocolNumber = header.IPv4ProtocolNumber
 									ipHdr.Encode(&header.IPv4Fields{
 										TotalLength: uint16(packetLen + len(data)),
 										TTL:         64,
 										Protocol:    uint8(header.UDPProtocolNumber),
 										SrcAddr:     tcpip.AddrFrom4(src.Addr().As4()),
 										DstAddr:     tcpip.AddrFrom4(dst.Addr().As4()),
 									})
 									// Encode wrote a zero checksum field; compute the real header
 									// checksum now that every other field is in place.
 									ipHdr.SetChecksum(^ipHdr.CalculateChecksum())
 									return pkt
 								}
 								// makeUDP6PacketBuffer returns a packet buffer holding a UDP-over-IPv6 packet
 								// from src to dst with a small fixed payload, for use as test input. It panics
 								// if either address is not IPv6.
 								//
 								// The UDP checksum is computed over the IPv6 pseudo-header, the UDP header
 								// and the payload.
 								func makeUDP6PacketBuffer(src, dst netip.AddrPort) *stack.PacketBuffer {
 									if !src.Addr().Is6() || !dst.Addr().Is6() {
 										panic("src and dst must be IPv6")
 									}
 									data := []byte("hello world\n")
 									packetLen := header.IPv6MinimumSize + header.UDPMinimumSize
 									pkt := stack.NewPacketBuffer(stack.PacketBufferOptions{
 										ReserveHeaderBytes: packetLen,
 										Payload:            buffer.MakeWithData(data),
 									})
 									srcAddr := tcpip.AddrFrom16(src.Addr().As16())
 									dstAddr := tcpip.AddrFrom16(dst.Addr().As16())
 									// Initialize the UDP header. As in makeUDP4PacketBuffer, the transport
 									// header is pushed before the network header: Push places bytes at the
 									// front of the packet, so the header pushed last ends up outermost.
 									udp := header.UDP(pkt.TransportHeader().Push(header.UDPMinimumSize))
 									pkt.TransportProtocolNumber = header.UDPProtocolNumber
 									// With only the UDP header pushed, pkt.Size() is the UDP header plus
 									// the payload, which is the UDP length.
 									length := uint16(pkt.Size())
 									udp.Encode(&header.UDPFields{
 										SrcPort: src.Port(),
 										DstPort: dst.Port(),
 										Length:  length,
 									})
 									// Calculate the UDP checksum. The pseudo-header sum and the payload
 									// sum are combined with one's-complement addition (end-around carry)
 									// and used as the seed for the sum over the UDP header itself.
 									partial := uint32(header.PseudoHeaderChecksum(header.UDPProtocolNumber, srcAddr, dstAddr, length))
 									partial += uint32(pkt.Data().Checksum())
 									partial = partial&0xffff + partial>>16
 									xsum := udp.CalculateChecksum(uint16(partial))
 									// A transmitted checksum of zero means "no checksum", which is not
 									// allowed for UDP over IPv6, so a sum of 0xffff is sent as is rather
 									// than being complemented to zero.
 									if xsum != 0xffff {
 										xsum = ^xsum
 									}
 									udp.SetChecksum(xsum)
 									// Add IP header
 									ipHdr := header.IPv6(pkt.NetworkHeader().Push(header.IPv6MinimumSize))
 									pkt.NetworkProtocolNumber = header.IPv6ProtocolNumber
 									ipHdr.Encode(&header.IPv6Fields{
 										SrcAddr:           srcAddr,
 										DstAddr:           dstAddr,
 										PayloadLength:     length,
 										TransportProtocol: header.UDPProtocolNumber,
 										HopLimit:          64,
 									})
 									return pkt
 								}