2023-01-27 13:37:20 -08:00
|
|
|
// Copyright (c) Tailscale Inc & AUTHORS
|
|
|
|
// SPDX-License-Identifier: BSD-3-Clause
|
2020-03-05 10:29:19 -08:00
|
|
|
|
|
|
|
// Package dnscache contains a minimal DNS cache that makes a bunch of
|
|
|
|
// assumptions that are only valid for us. Not recommended for general use.
|
|
|
|
package dnscache
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2021-02-26 12:49:54 -08:00
|
|
|
"crypto/tls"
|
|
|
|
"errors"
|
2020-03-05 10:29:19 -08:00
|
|
|
"fmt"
|
2020-11-11 12:37:53 -08:00
|
|
|
"log"
|
2020-03-05 10:29:19 -08:00
|
|
|
"net"
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer needed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
"net/netip"
|
2020-03-09 14:19:29 -04:00
|
|
|
"runtime"
|
2020-03-05 10:29:19 -08:00
|
|
|
"sync"
|
2023-01-24 14:31:20 -05:00
|
|
|
"sync/atomic"
|
2020-03-05 10:29:19 -08:00
|
|
|
"time"
|
|
|
|
|
2022-01-24 10:52:57 -08:00
|
|
|
"tailscale.com/envknob"
|
2023-01-24 14:31:20 -05:00
|
|
|
"tailscale.com/types/logger"
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
"tailscale.com/util/cloudenv"
|
2022-06-17 10:09:23 -07:00
|
|
|
"tailscale.com/util/singleflight"
|
2023-03-03 13:15:56 -05:00
|
|
|
"tailscale.com/util/slicesx"
|
2020-03-05 10:29:19 -08:00
|
|
|
)
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
// zaddr is the zero netip.Addr. It is returned in place of an address when
// there is no address to report.
var zaddr netip.Addr
|
|
|
|
|
2020-03-09 21:04:08 -07:00
|
|
|
var single = &Resolver{
|
|
|
|
Forward: &net.Resolver{PreferGo: preferGoResolver()},
|
|
|
|
}
|
2020-03-09 14:19:29 -04:00
|
|
|
|
2020-03-09 21:04:08 -07:00
|
|
|
// preferGoResolver reports whether Go's built-in DNS resolver should be
// preferred on the operating system this binary was built for.
func preferGoResolver() bool {
	switch runtime.GOOS {
	case "darwin", "ios":
		// There does not appear to be a local resolver running
		// on iOS, and NetworkExtension is good at isolating DNS.
		// So do not use the Go resolver on macOS/iOS.
		return false
	case "android":
		// The local resolver is not available on Android.
		return false
	}

	// Otherwise, the Go resolver is fine and slightly preferred
	// since it's lighter, not using cgo calls & threads.
	return true
}
|
2020-03-05 10:29:19 -08:00
|
|
|
|
|
|
|
// Get returns a caching Resolver singleton.
|
|
|
|
func Get() *Resolver { return single }
|
|
|
|
|
|
|
|
// Resolver is a minimal DNS caching resolver.
|
|
|
|
//
|
|
|
|
// The TTL is always fixed for now. It's not intended for general use.
|
|
|
|
// Cache entries are never cleaned up so it's intended that this is
|
|
|
|
// only used with a fixed set of hostnames.
|
|
|
|
type Resolver struct {
|
|
|
|
// Forward is the resolver to use to populate the cache.
|
|
|
|
// If nil, net.DefaultResolver is used.
|
|
|
|
Forward *net.Resolver
|
|
|
|
|
2021-02-26 12:49:54 -08:00
|
|
|
// LookupIPFallback optionally provides a backup DNS mechanism
|
|
|
|
// to use if Forward returns an error or no results.
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
LookupIPFallback func(ctx context.Context, host string) ([]netip.Addr, error)
|
2021-02-26 12:49:54 -08:00
|
|
|
|
2020-11-11 12:37:53 -08:00
|
|
|
// TTL is how long to keep entries cached
|
|
|
|
//
|
|
|
|
// If zero, a default (currently 10 minutes) is used.
|
|
|
|
TTL time.Duration
|
|
|
|
|
|
|
|
// UseLastGood controls whether a cached entry older than TTL is used
|
|
|
|
// if a refresh fails.
|
|
|
|
UseLastGood bool
|
|
|
|
|
2022-04-18 12:50:26 -07:00
|
|
|
// SingleHostStaticResult, if non-nil, is the static result of IPs that is returned
|
|
|
|
// by Resolver.LookupIP for any hostname. When non-nil, SingleHost must also be
|
|
|
|
// set with the expected name.
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
SingleHostStaticResult []netip.Addr
|
2022-04-18 12:50:26 -07:00
|
|
|
|
|
|
|
// SingleHost is the hostname that SingleHostStaticResult is for.
|
|
|
|
// It is required when SingleHostStaticResult is present.
|
|
|
|
SingleHost string
|
|
|
|
|
2023-01-24 14:31:20 -05:00
|
|
|
// Logf optionally provides a log function to use for debug logs. If
|
|
|
|
// not present, log.Printf will be used. The prefix "dnscache: " will
|
|
|
|
// be added to all log messages printed with this logger.
|
|
|
|
Logf logger.Logf
|
|
|
|
|
2022-06-17 10:09:23 -07:00
|
|
|
sf singleflight.Group[string, ipRes]
|
2020-03-05 10:29:19 -08:00
|
|
|
|
|
|
|
mu sync.Mutex
|
|
|
|
ipCache map[string]ipCacheEntry
|
|
|
|
}
|
|
|
|
|
2022-06-17 10:09:23 -07:00
|
|
|
// ipRes is the type used by the Resolver.sf singleflight group.
//
// It bundles the three values a lookup produces. The field order matters:
// LookupIP builds it with an unkeyed composite literal.
type ipRes struct {
	ip     netip.Addr   // first address result of the lookup
	ip6    netip.Addr   // second address result; may be the zero netip.Addr
	allIPs []netip.Addr // every address the lookup returned
}
|
|
|
|
|
2020-03-05 10:29:19 -08:00
|
|
|
// ipCacheEntry is the cached lookup result stored per hostname in
// Resolver.ipCache.
type ipCacheEntry struct {
	ip      netip.Addr   // either v4 or v6
	ip6     netip.Addr   // zero netip.Addr (not valid) if no v4 or no v6
	allIPs  []netip.Addr // 1+ v4 and/or v6
	expires time.Time    // the entry counts as fresh only while this is in the future
}
|
|
|
|
|
|
|
|
func (r *Resolver) fwd() *net.Resolver {
|
|
|
|
if r.Forward != nil {
|
|
|
|
return r.Forward
|
|
|
|
}
|
|
|
|
return net.DefaultResolver
|
|
|
|
}
|
|
|
|
|
2023-01-24 14:31:20 -05:00
|
|
|
// dlogf logs a debug message if debug logging is enabled either globally via
|
|
|
|
// the TS_DEBUG_DNS_CACHE environment variable or via the per-Resolver
|
|
|
|
// configuration.
|
|
|
|
func (r *Resolver) dlogf(format string, args ...any) {
|
|
|
|
logf := r.Logf
|
|
|
|
if logf == nil {
|
|
|
|
logf = log.Printf
|
|
|
|
}
|
|
|
|
|
|
|
|
if debug() || debugLogging.Load() {
|
|
|
|
logf("dnscache: "+format, args...)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
// cloudHostResolver returns a Resolver for the current cloud hosting environment.
|
|
|
|
// It currently only supports Google Cloud.
|
|
|
|
func (r *Resolver) cloudHostResolver() (v *net.Resolver, ok bool) {
|
|
|
|
switch runtime.GOOS {
|
|
|
|
case "android", "ios", "darwin":
|
|
|
|
return nil, false
|
|
|
|
}
|
2022-06-29 19:32:41 -07:00
|
|
|
ip := cloudenv.Get().ResolverIP()
|
|
|
|
if ip == "" {
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
return nil, false
|
|
|
|
}
|
|
|
|
return &net.Resolver{
|
|
|
|
PreferGo: true,
|
|
|
|
Dial: func(ctx context.Context, network, address string) (net.Conn, error) {
|
|
|
|
var d net.Dialer
|
2022-06-29 19:32:41 -07:00
|
|
|
return d.DialContext(ctx, network, net.JoinHostPort(ip, "53"))
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
},
|
|
|
|
}, true
|
|
|
|
}
|
|
|
|
|
2020-11-11 12:37:53 -08:00
|
|
|
func (r *Resolver) ttl() time.Duration {
|
|
|
|
if r.TTL > 0 {
|
|
|
|
return r.TTL
|
|
|
|
}
|
|
|
|
return 10 * time.Minute
|
|
|
|
}
|
|
|
|
|
2022-09-14 12:49:39 -07:00
|
|
|
// debug is the accessor registered for the TS_DEBUG_DNS_CACHE envknob.
// dlogf emits debug logs when it returns true.
var debug = envknob.RegisterBool("TS_DEBUG_DNS_CACHE")
|
2020-11-11 12:37:53 -08:00
|
|
|
|
2023-01-24 14:31:20 -05:00
|
|
|
// debugLogging allows enabling debug logging at runtime, via
// SetDebugLoggingEnabled.
//
// This is a global variable instead of a per-Resolver variable because we
// create new Resolvers throughout the lifetime of the program (e.g. on every
// new Direct client, etc.). When we enable debug logs, though, we want to do
// so for every single created Resolver; we'd need to plumb a bunch of new code
// through all of the intermediate packages to accomplish the same behaviour as
// just using a global variable.
var debugLogging atomic.Bool
|
|
|
|
|
|
|
|
// SetDebugLoggingEnabled controls whether debug logging is enabled for this
|
|
|
|
// package.
|
|
|
|
//
|
|
|
|
// These logs are also printed when the TS_DEBUG_DNS_CACHE envknob is set, but
|
|
|
|
// we allow configuring this manually as well so that it can be changed at
|
|
|
|
// runtime.
|
|
|
|
func SetDebugLoggingEnabled(v bool) {
|
|
|
|
debugLogging.Store(v)
|
|
|
|
}
|
|
|
|
|
2021-01-06 19:50:19 -08:00
|
|
|
// LookupIP returns the host's primary IP address (either IPv4 or
|
|
|
|
// IPv6, but preferring IPv4) and optionally its IPv6 address, if
|
|
|
|
// there is both IPv4 and IPv6.
|
|
|
|
//
|
|
|
|
// If err is nil, ip will be non-nil. The v6 address may be nil even
|
|
|
|
// with a nil error.
|
2022-08-16 14:45:46 -04:00
|
|
|
func (r *Resolver) LookupIP(ctx context.Context, host string) (ip, v6 netip.Addr, allIPs []netip.Addr, err error) {
|
2022-04-18 12:50:26 -07:00
|
|
|
if r.SingleHostStaticResult != nil {
|
|
|
|
if r.SingleHost != host {
|
2022-08-16 14:45:46 -04:00
|
|
|
return zaddr, zaddr, nil, fmt.Errorf("dnscache: unexpected hostname %q doesn't match expected %q", host, r.SingleHost)
|
2022-04-18 12:50:26 -07:00
|
|
|
}
|
|
|
|
for _, naIP := range r.SingleHostStaticResult {
|
2022-08-16 14:45:46 -04:00
|
|
|
if !ip.IsValid() && naIP.Is4() {
|
|
|
|
ip = naIP
|
2022-04-18 12:50:26 -07:00
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
if !v6.IsValid() && naIP.Is6() {
|
|
|
|
v6 = naIP
|
2022-04-18 12:50:26 -07:00
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
allIPs = append(allIPs, naIP)
|
2022-04-18 12:50:26 -07:00
|
|
|
}
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("returning %d static results", len(allIPs))
|
2022-04-18 12:50:26 -07:00
|
|
|
return
|
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
if ip, err := netip.ParseAddr(host); err == nil {
|
|
|
|
ip = ip.Unmap()
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q is an IP", host)
|
2022-08-16 14:45:46 -04:00
|
|
|
return ip, zaddr, []netip.Addr{ip}, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2021-07-26 11:58:28 -07:00
|
|
|
if ip, ip6, allIPs, ok := r.lookupIPCache(host); ok {
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q = %v (cached)", host, ip)
|
2021-07-26 11:58:28 -07:00
|
|
|
return ip, ip6, allIPs, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2022-06-17 10:09:23 -07:00
|
|
|
ch := r.sf.DoChan(host, func() (ret ipRes, _ error) {
|
2021-07-26 11:58:28 -07:00
|
|
|
ip, ip6, allIPs, err := r.lookupIP(host)
|
2020-03-05 10:29:19 -08:00
|
|
|
if err != nil {
|
2022-06-17 10:09:23 -07:00
|
|
|
return ret, err
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
2021-07-26 11:58:28 -07:00
|
|
|
return ipRes{ip, ip6, allIPs}, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
})
|
|
|
|
select {
|
|
|
|
case res := <-ch:
|
|
|
|
if res.Err != nil {
|
2020-11-11 12:37:53 -08:00
|
|
|
if r.UseLastGood {
|
2021-07-26 11:58:28 -07:00
|
|
|
if ip, ip6, allIPs, ok := r.lookupIPCacheExpired(host); ok {
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q using %v after error", host, ip)
|
2021-07-26 11:58:28 -07:00
|
|
|
return ip, ip6, allIPs, nil
|
2020-11-11 12:37:53 -08:00
|
|
|
}
|
|
|
|
}
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("error resolving %q: %v", host, res.Err)
|
2022-08-16 14:45:46 -04:00
|
|
|
return zaddr, zaddr, nil, res.Err
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
2022-06-17 10:09:23 -07:00
|
|
|
r := res.Val
|
2021-07-26 11:58:28 -07:00
|
|
|
return r.ip, r.ip6, r.allIPs, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
case <-ctx.Done():
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("context done while resolving %q: %v", host, ctx.Err())
|
2022-08-16 14:45:46 -04:00
|
|
|
return zaddr, zaddr, nil, ctx.Err()
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
func (r *Resolver) lookupIPCache(host string) (ip, ip6 netip.Addr, allIPs []netip.Addr, ok bool) {
|
2020-03-05 10:29:19 -08:00
|
|
|
r.mu.Lock()
|
|
|
|
defer r.mu.Unlock()
|
|
|
|
if ent, ok := r.ipCache[host]; ok && ent.expires.After(time.Now()) {
|
2021-07-26 11:58:28 -07:00
|
|
|
return ent.ip, ent.ip6, ent.allIPs, true
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
return zaddr, zaddr, nil, false
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
func (r *Resolver) lookupIPCacheExpired(host string) (ip, ip6 netip.Addr, allIPs []netip.Addr, ok bool) {
|
2020-11-11 12:37:53 -08:00
|
|
|
r.mu.Lock()
|
|
|
|
defer r.mu.Unlock()
|
|
|
|
if ent, ok := r.ipCache[host]; ok {
|
2021-07-26 11:58:28 -07:00
|
|
|
return ent.ip, ent.ip6, ent.allIPs, true
|
2020-11-11 12:37:53 -08:00
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
return zaddr, zaddr, nil, false
|
2020-11-11 12:37:53 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
func (r *Resolver) lookupTimeoutForHost(host string) time.Duration {
|
|
|
|
if r.UseLastGood {
|
2021-07-26 11:58:28 -07:00
|
|
|
if _, _, _, ok := r.lookupIPCacheExpired(host); ok {
|
2020-11-11 12:37:53 -08:00
|
|
|
// If we have some previous good value for this host,
|
|
|
|
// don't give this DNS lookup much time. If we're in a
|
|
|
|
// situation where the user's DNS server is unreachable
|
|
|
|
// (e.g. their corp DNS server is behind a subnet router
|
|
|
|
// that can't come up due to Tailscale needing to
|
|
|
|
// connect to itself), then we want to fail fast and let
|
|
|
|
// our caller (who set UseLastGood) fall back to using
|
|
|
|
// the last-known-good IP address.
|
|
|
|
return 3 * time.Second
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 10 * time.Second
|
|
|
|
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
func (r *Resolver) lookupIP(host string) (ip, ip6 netip.Addr, allIPs []netip.Addr, err error) {
|
2021-07-26 11:58:28 -07:00
|
|
|
if ip, ip6, allIPs, ok := r.lookupIPCache(host); ok {
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q found in cache as %v", host, ip)
|
2021-07-26 11:58:28 -07:00
|
|
|
return ip, ip6, allIPs, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2020-11-11 12:37:53 -08:00
|
|
|
ctx, cancel := context.WithTimeout(context.Background(), r.lookupTimeoutForHost(host))
|
2020-03-05 10:29:19 -08:00
|
|
|
defer cancel()
|
2022-08-16 14:45:46 -04:00
|
|
|
ips, err := r.fwd().LookupNetIP(ctx, "ip", host)
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
if err != nil || len(ips) == 0 {
|
|
|
|
if resolver, ok := r.cloudHostResolver(); ok {
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("resolving %q via cloud resolver", host)
|
2022-08-16 14:45:46 -04:00
|
|
|
ips, err = resolver.LookupNetIP(ctx, "ip", host)
|
ipn/ipnlocal, net/dns*, util/cloudenv: specialize DNS config on Google Cloud
This does three things:
* If you're on GCP, it adds a *.internal DNS split route to the
metadata server, so we never break GCP DNS names. This lets people
have some Tailscale nodes on GCP and some not (e.g. laptops at home)
without having to add a Tailnet-wide *.internal DNS route.
If you already have such a route, though, it won't overwrite it.
* If the 100.100.100.100 DNS forwarder has nowhere to forward to,
it forwards it to the GCP metadata IP, which forwards to 8.8.8.8.
This means there are never errNoUpstreams ("upstream nameservers not set")
errors on GCP due to e.g. mangled /etc/resolv.conf (GCP default VMs
don't have systemd-resolved, so it's likely a DNS supremacy fight)
* makes the DNS fallback mechanism use the GCP metadata IP as a
fallback before our hosted HTTP-based fallbacks
I created a default GCP VM from their web wizard. It has no
systemd-resolved.
I then made its /etc/resolv.conf be empty and deleted its GCP
hostnames in /etc/hosts.
I then logged in to a tailnet with no global DNS settings.
With this, tailscaled writes /etc/resolv.conf (direct mode, as no
systemd-resolved) and sets it to 100.100.100.100, which then has
regular DNS via the metadata IP and *.internal DNS via the metadata IP
as well. If the tailnet configures explicit DNS servers, those are used
instead, except for *.internal.
This also adds a new util/cloudenv package based on version/distro
where the cloud type is only detected once. We'll likely expand it in
the future for other clouds, doing variants of this change for other
popular cloud environments.
Fixes #4911
RELNOTES=Google Cloud DNS improvements
Change-Id: I19f3c2075983669b2b2c0f29a548da8de373c7cf
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-06-29 13:19:34 -07:00
|
|
|
}
|
|
|
|
}
|
2021-02-26 12:49:54 -08:00
|
|
|
if (err != nil || len(ips) == 0) && r.LookupIPFallback != nil {
|
|
|
|
ctx, cancel := context.WithTimeout(context.Background(), 30*time.Second)
|
|
|
|
defer cancel()
|
2023-01-24 14:31:20 -05:00
|
|
|
if err != nil {
|
|
|
|
r.dlogf("resolving %q using fallback resolver due to error", host)
|
|
|
|
} else {
|
|
|
|
r.dlogf("resolving %q using fallback resolver due to no returned IPs", host)
|
|
|
|
}
|
2022-08-16 14:45:46 -04:00
|
|
|
ips, err = r.LookupIPFallback(ctx, host)
|
2021-02-26 12:49:54 -08:00
|
|
|
}
|
2020-03-05 10:29:19 -08:00
|
|
|
if err != nil {
|
2022-08-16 14:45:46 -04:00
|
|
|
return netip.Addr{}, netip.Addr{}, nil, err
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
if len(ips) == 0 {
|
2022-08-16 14:45:46 -04:00
|
|
|
return netip.Addr{}, netip.Addr{}, nil, fmt.Errorf("no IPs for %q found", host)
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2022-12-09 15:12:20 -08:00
|
|
|
// Unmap everything; LookupNetIP can return mapped addresses (see #5698)
|
2022-10-22 15:55:59 -04:00
|
|
|
for i := range ips {
|
|
|
|
ips[i] = ips[i].Unmap()
|
|
|
|
}
|
|
|
|
|
2021-01-06 19:50:19 -08:00
|
|
|
have4 := false
|
2020-03-05 10:29:19 -08:00
|
|
|
for _, ipa := range ips {
|
2022-08-16 14:45:46 -04:00
|
|
|
if ipa.Is4() {
|
2021-01-06 19:50:19 -08:00
|
|
|
if !have4 {
|
|
|
|
ip6 = ip
|
2022-08-16 14:45:46 -04:00
|
|
|
ip = ipa
|
2021-01-06 19:50:19 -08:00
|
|
|
have4 = true
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if have4 {
|
2022-08-16 14:45:46 -04:00
|
|
|
ip6 = ipa
|
2021-01-06 19:50:19 -08:00
|
|
|
} else {
|
2022-08-16 14:45:46 -04:00
|
|
|
ip = ipa
|
2021-01-06 19:50:19 -08:00
|
|
|
}
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
}
|
2021-07-26 11:58:28 -07:00
|
|
|
r.addIPCache(host, ip, ip6, ips, r.ttl())
|
|
|
|
return ip, ip6, ips, nil
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
func (r *Resolver) addIPCache(host string, ip, ip6 netip.Addr, allIPs []netip.Addr, d time.Duration) {
|
2022-08-02 13:38:11 -07:00
|
|
|
if ip.IsPrivate() {
|
2020-03-05 10:29:19 -08:00
|
|
|
// Don't cache obviously wrong entries from captive portals.
|
|
|
|
// TODO: use DoH or DoT for the forwarding resolver?
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q resolved to private IP %v; using but not caching", host, ip)
|
2021-01-06 19:50:19 -08:00
|
|
|
return
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2023-01-24 14:31:20 -05:00
|
|
|
r.dlogf("%q resolved to IP %v; caching", host, ip)
|
2020-11-11 12:37:53 -08:00
|
|
|
|
2020-03-05 10:29:19 -08:00
|
|
|
r.mu.Lock()
|
|
|
|
defer r.mu.Unlock()
|
|
|
|
if r.ipCache == nil {
|
|
|
|
r.ipCache = make(map[string]ipCacheEntry)
|
|
|
|
}
|
2021-07-26 11:58:28 -07:00
|
|
|
r.ipCache[host] = ipCacheEntry{
|
|
|
|
ip: ip,
|
|
|
|
ip6: ip6,
|
|
|
|
allIPs: allIPs,
|
|
|
|
expires: time.Now().Add(d),
|
|
|
|
}
|
2020-03-05 10:29:19 -08:00
|
|
|
}
|
|
|
|
|
2020-11-11 12:37:53 -08:00
|
|
|
// DialContextFunc is the signature of a context-aware dial function. It has
// the same shape as the DialContext method of net.Dialer.
type DialContextFunc func(ctx context.Context, network, address string) (net.Conn, error)
|
|
|
|
|
|
|
|
// Dialer returns a wrapped DialContext func that uses the provided dnsCache.
|
|
|
|
func Dialer(fwd DialContextFunc, dnsCache *Resolver) DialContextFunc {
|
2022-02-14 09:38:23 -08:00
|
|
|
d := &dialer{
|
2022-02-14 13:25:19 -08:00
|
|
|
fwd: fwd,
|
|
|
|
dnsCache: dnsCache,
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
pastConnect: map[netip.Addr]time.Time{},
|
2022-02-14 09:38:23 -08:00
|
|
|
}
|
|
|
|
return d.DialContext
|
|
|
|
}
|
|
|
|
|
|
|
|
// dialer is the config and accumulated state for a dial func returned by Dialer.
|
|
|
|
type dialer struct {
|
|
|
|
fwd DialContextFunc
|
|
|
|
dnsCache *Resolver
|
2022-02-14 13:25:19 -08:00
|
|
|
|
|
|
|
mu sync.Mutex
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
pastConnect map[netip.Addr]time.Time
|
2022-02-14 09:38:23 -08:00
|
|
|
}
|
2021-02-26 12:49:54 -08:00
|
|
|
|
2022-02-14 09:38:23 -08:00
|
|
|
func (d *dialer) DialContext(ctx context.Context, network, address string) (retConn net.Conn, ret error) {
|
|
|
|
host, port, err := net.SplitHostPort(address)
|
|
|
|
if err != nil {
|
|
|
|
// Bogus. But just let the real dialer return an error rather than
|
|
|
|
// inventing a similar one.
|
|
|
|
return d.fwd(ctx, network, address)
|
|
|
|
}
|
|
|
|
dc := &dialCall{
|
|
|
|
d: d,
|
|
|
|
network: network,
|
|
|
|
address: address,
|
|
|
|
host: host,
|
|
|
|
port: port,
|
|
|
|
}
|
|
|
|
defer func() {
|
2022-02-14 13:25:19 -08:00
|
|
|
// On failure, consider that our DNS might be wrong and ask the DNS fallback mechanism for
|
|
|
|
// some other IPs to try.
|
2022-09-15 10:41:45 -04:00
|
|
|
if !d.shouldTryBootstrap(ctx, ret, dc) {
|
2022-02-14 09:38:23 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
ips, err := d.dnsCache.LookupIPFallback(ctx, host)
|
2020-11-11 12:37:53 -08:00
|
|
|
if err != nil {
|
2022-02-14 09:38:23 -08:00
|
|
|
// Return with original error
|
|
|
|
return
|
2020-11-11 12:37:53 -08:00
|
|
|
}
|
2022-02-14 09:38:23 -08:00
|
|
|
if c, err := dc.raceDial(ctx, ips); err == nil {
|
|
|
|
retConn = c
|
|
|
|
ret = nil
|
|
|
|
return
|
2021-07-26 14:36:21 -07:00
|
|
|
}
|
2022-02-14 09:38:23 -08:00
|
|
|
}()
|
2021-07-26 14:36:21 -07:00
|
|
|
|
2022-02-14 09:38:23 -08:00
|
|
|
ip, ip6, allIPs, err := d.dnsCache.LookupIP(ctx, host)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to resolve %q: %w", host, err)
|
|
|
|
}
|
|
|
|
i4s := v4addrs(allIPs)
|
|
|
|
if len(i4s) < 2 {
|
2023-01-24 14:31:20 -05:00
|
|
|
d.dnsCache.dlogf("dialing %s, %s for %s", network, ip, address)
|
2022-08-16 14:45:46 -04:00
|
|
|
c, err := dc.dialOne(ctx, ip.Unmap())
|
2022-02-14 13:25:19 -08:00
|
|
|
if err == nil || ctx.Err() != nil {
|
2022-02-14 09:38:23 -08:00
|
|
|
return c, err
|
|
|
|
}
|
2022-02-14 13:25:19 -08:00
|
|
|
// Fall back to trying IPv6, if any.
|
2022-08-16 14:45:46 -04:00
|
|
|
return dc.dialOne(ctx, ip6)
|
2021-07-26 14:36:21 -07:00
|
|
|
}
|
2022-02-14 09:38:23 -08:00
|
|
|
|
|
|
|
// Multiple IPv4 candidates, and 0+ IPv6.
|
|
|
|
ipsToTry := append(i4s, v6addrs(allIPs)...)
|
|
|
|
return dc.raceDial(ctx, ipsToTry)
|
|
|
|
}
|
|
|
|
|
2022-09-15 10:41:45 -04:00
|
|
|
func (d *dialer) shouldTryBootstrap(ctx context.Context, err error, dc *dialCall) bool {
|
|
|
|
// No need to do anything when we succeeded.
|
|
|
|
if err == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
// Can't try bootstrap DNS if we don't have a fallback function
|
|
|
|
if d.dnsCache.LookupIPFallback == nil {
|
2023-01-24 14:31:20 -05:00
|
|
|
d.dnsCache.dlogf("not using bootstrap DNS: no fallback")
|
2022-09-15 10:41:45 -04:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
// We can't retry if the context is canceled, since any further
|
|
|
|
// operations with this context will fail.
|
|
|
|
if ctxErr := ctx.Err(); ctxErr != nil {
|
2023-01-24 14:31:20 -05:00
|
|
|
d.dnsCache.dlogf("not using bootstrap DNS: context error: %v", ctxErr)
|
2022-09-15 10:41:45 -04:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
wasTrustworthy := dc.dnsWasTrustworthy()
|
|
|
|
if wasTrustworthy {
|
2023-01-24 14:31:20 -05:00
|
|
|
d.dnsCache.dlogf("not using bootstrap DNS: DNS was trustworthy")
|
2022-09-15 10:41:45 -04:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2022-02-14 09:38:23 -08:00
|
|
|
// dialCall is the state around a single call to dial.
|
|
|
|
type dialCall struct {
|
|
|
|
d *dialer
|
|
|
|
network, address, host, port string
|
2022-02-14 13:25:19 -08:00
|
|
|
|
|
|
|
mu sync.Mutex // lock ordering: dialer.mu, then dialCall.mu
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
fails map[netip.Addr]error // set of IPs that failed to dial thus far
|
2022-02-14 13:25:19 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// dnsWasTrustworthy reports whether we think the IP address(es) we
|
|
|
|
// tried (and failed) to dial were probably the correct IPs. Currently
|
|
|
|
// the heuristic is whether they ever worked previously.
|
|
|
|
func (dc *dialCall) dnsWasTrustworthy() bool {
|
|
|
|
dc.d.mu.Lock()
|
|
|
|
defer dc.d.mu.Unlock()
|
|
|
|
dc.mu.Lock()
|
|
|
|
defer dc.mu.Unlock()
|
|
|
|
|
|
|
|
if len(dc.fails) == 0 {
|
|
|
|
// No information.
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
// If any of the IPs we failed to dial worked previously in
|
|
|
|
// this dialer, assume the DNS is fine.
|
|
|
|
for ip := range dc.fails {
|
|
|
|
if _, ok := dc.d.pastConnect[ip]; ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer needed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
func (dc *dialCall) dialOne(ctx context.Context, ip netip.Addr) (net.Conn, error) {
|
2022-02-14 13:25:19 -08:00
|
|
|
c, err := dc.d.fwd(ctx, dc.network, net.JoinHostPort(ip.String(), dc.port))
|
|
|
|
dc.noteDialResult(ip, err)
|
|
|
|
return c, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// noteDialResult records that a dial to ip either succeeded or
|
|
|
|
// failed.
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
func (dc *dialCall) noteDialResult(ip netip.Addr, err error) {
|
2022-02-14 13:25:19 -08:00
|
|
|
if err == nil {
|
|
|
|
d := dc.d
|
|
|
|
d.mu.Lock()
|
|
|
|
defer d.mu.Unlock()
|
|
|
|
d.pastConnect[ip] = time.Now()
|
|
|
|
return
|
|
|
|
}
|
|
|
|
dc.mu.Lock()
|
|
|
|
defer dc.mu.Unlock()
|
|
|
|
if dc.fails == nil {
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
dc.fails = map[netip.Addr]error{}
|
2022-02-14 13:25:19 -08:00
|
|
|
}
|
|
|
|
dc.fails[ip] = err
|
|
|
|
}
|
|
|
|
|
|
|
|
// uniqueIPs returns a possibly-mutated subslice of ips, filtering out
|
|
|
|
// dups and ones that have already failed previously.
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
func (dc *dialCall) uniqueIPs(ips []netip.Addr) (ret []netip.Addr) {
|
2022-02-14 13:25:19 -08:00
|
|
|
dc.mu.Lock()
|
|
|
|
defer dc.mu.Unlock()
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
seen := map[netip.Addr]bool{}
|
2022-02-14 13:25:19 -08:00
|
|
|
ret = ips[:0]
|
|
|
|
for _, ip := range ips {
|
|
|
|
if seen[ip] {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
seen[ip] = true
|
|
|
|
if dc.fails[ip] != nil {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
ret = append(ret, ip)
|
|
|
|
}
|
|
|
|
return ret
|
2021-07-26 14:36:21 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// fallbackDelay is the pause between starting dials to successive candidate
// addresses when more than one is available.
//
// The value, 300ms, matches the fallbackDelay Go uses for Happy Eyeballs.
const fallbackDelay = 300 * time.Millisecond
|
|
|
|
|
|
|
|
// raceDial tries to dial port on each ip in ips, starting a new race
|
2021-07-26 16:16:08 -07:00
|
|
|
// dial every fallbackDelay apart, returning whichever completes first.
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
func (dc *dialCall) raceDial(ctx context.Context, ips []netip.Addr) (net.Conn, error) {
|
2021-07-26 14:36:21 -07:00
|
|
|
ctx, cancel := context.WithCancel(ctx)
|
|
|
|
defer cancel()
|
|
|
|
|
|
|
|
type res struct {
|
|
|
|
c net.Conn
|
|
|
|
err error
|
|
|
|
}
|
|
|
|
resc := make(chan res) // must be unbuffered
|
|
|
|
failBoost := make(chan struct{}) // best effort send on dial failure
|
|
|
|
|
2022-02-14 13:25:19 -08:00
|
|
|
// Remove IPs that we tried & failed to dial previously
|
|
|
|
// (such as when we're being called after a dnsfallback lookup and get
|
|
|
|
// the same results)
|
|
|
|
ips = dc.uniqueIPs(ips)
|
|
|
|
if len(ips) == 0 {
|
|
|
|
return nil, errors.New("no IPs")
|
|
|
|
}
|
|
|
|
|
2022-08-11 19:00:39 -04:00
|
|
|
// Partition candidate list and then merge such that an IPv6 address is
|
|
|
|
// in the first spot if present, and then addresses are interleaved.
|
|
|
|
// This ensures that we're trying an IPv6 address first, then
|
|
|
|
// alternating between v4 and v6 in case one of the two networks is
|
|
|
|
// broken.
|
|
|
|
var iv4, iv6 []netip.Addr
|
|
|
|
for _, ip := range ips {
|
|
|
|
if ip.Is6() {
|
|
|
|
iv6 = append(iv6, ip)
|
|
|
|
} else {
|
|
|
|
iv4 = append(iv4, ip)
|
|
|
|
}
|
|
|
|
}
|
2023-03-03 13:15:56 -05:00
|
|
|
ips = slicesx.Interleave(iv6, iv4)
|
2022-08-11 19:00:39 -04:00
|
|
|
|
2021-07-26 14:36:21 -07:00
|
|
|
go func() {
|
|
|
|
for i, ip := range ips {
|
|
|
|
if i != 0 {
|
|
|
|
timer := time.NewTimer(fallbackDelay)
|
|
|
|
select {
|
|
|
|
case <-timer.C:
|
|
|
|
case <-failBoost:
|
|
|
|
timer.Stop()
|
|
|
|
case <-ctx.Done():
|
|
|
|
timer.Stop()
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
all: convert more code to use net/netip directly
perl -i -npe 's,netaddr.IPPrefixFrom,netip.PrefixFrom,' $(git grep -l -F netaddr.)
perl -i -npe 's,netaddr.IPPortFrom,netip.AddrPortFrom,' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPrefix,netip.Prefix,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPPort,netip.AddrPort,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IP\b,netip.Addr,g' $(git grep -l -F netaddr. )
perl -i -npe 's,netaddr.IPv6Raw\b,netip.AddrFrom16,g' $(git grep -l -F netaddr. )
goimports -w .
Then delete some stuff from the net/netaddr shim package which is no
longer neeed.
Updates #5162
Change-Id: Ia7a86893fe21c7e3ee1ec823e8aba288d4566cd8
Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
2022-07-25 21:14:09 -07:00
|
|
|
go func(ip netip.Addr) {
|
2022-02-14 13:25:19 -08:00
|
|
|
c, err := dc.dialOne(ctx, ip)
|
2021-07-26 14:36:21 -07:00
|
|
|
if err != nil {
|
|
|
|
// Best effort wake-up a pending dial.
|
|
|
|
// e.g. IPv4 dials failing quickly on an IPv6-only system.
|
|
|
|
// In that case we don't want to wait 300ms per IPv4 before
|
|
|
|
// we get to the IPv6 addresses.
|
|
|
|
select {
|
|
|
|
case failBoost <- struct{}{}:
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
}
|
|
|
|
select {
|
|
|
|
case resc <- res{c, err}:
|
|
|
|
case <-ctx.Done():
|
|
|
|
if c != nil {
|
|
|
|
c.Close()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}(ip)
|
2020-11-11 12:37:53 -08:00
|
|
|
}
|
2021-07-26 14:36:21 -07:00
|
|
|
}()
|
|
|
|
|
|
|
|
var firstErr error
|
|
|
|
var fails int
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case r := <-resc:
|
|
|
|
if r.c != nil {
|
|
|
|
return r.c, nil
|
|
|
|
}
|
|
|
|
fails++
|
|
|
|
if firstErr == nil {
|
|
|
|
firstErr = r.err
|
|
|
|
}
|
|
|
|
if fails == len(ips) {
|
|
|
|
return nil, firstErr
|
|
|
|
}
|
|
|
|
case <-ctx.Done():
|
|
|
|
return nil, ctx.Err()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
// v4addrs returns the IPv4 addresses found in aa, in order. IPv4-mapped IPv6
// addresses are included, converted to their plain IPv4 form. The result is
// nil when aa holds no such address.
func v4addrs(aa []netip.Addr) (ret []netip.Addr) {
	for i := range aa {
		if plain := aa[i].Unmap(); plain.Is4() {
			ret = append(ret, plain)
		}
	}
	return ret
}
|
|
|
|
|
2022-08-16 14:45:46 -04:00
|
|
|
// v6addrs returns the IPv6 addresses found in aa, in order, leaving out
// IPv4-mapped IPv6 addresses. The result is nil when aa holds no such
// address.
func v6addrs(aa []netip.Addr) (ret []netip.Addr) {
	for _, addr := range aa {
		if !addr.Is6() || addr.Is4In6() {
			continue
		}
		ret = append(ret, addr)
	}
	return ret
}
|
2021-02-26 12:49:54 -08:00
|
|
|
|
|
|
|
// TLSDialer is like Dialer but returns a func suitable for using with net/http.Transport.DialTLSContext.
|
|
|
|
// It returns a *tls.Conn type on success.
|
|
|
|
// On TLS cert validation failure, it can invoke a backup DNS resolution strategy.
|
|
|
|
func TLSDialer(fwd DialContextFunc, dnsCache *Resolver, tlsConfigBase *tls.Config) DialContextFunc {
|
|
|
|
tcpDialer := Dialer(fwd, dnsCache)
|
|
|
|
return func(ctx context.Context, network, address string) (net.Conn, error) {
|
|
|
|
host, _, err := net.SplitHostPort(address)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
tcpConn, err := tcpDialer(ctx, network, address)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
cfg := cloneTLSConfig(tlsConfigBase)
|
|
|
|
if cfg.ServerName == "" {
|
|
|
|
cfg.ServerName = host
|
|
|
|
}
|
|
|
|
tlsConn := tls.Client(tcpConn, cfg)
|
|
|
|
|
|
|
|
handshakeCtx, handshakeTimeoutCancel := context.WithTimeout(ctx, 5*time.Second)
|
|
|
|
defer handshakeTimeoutCancel()
|
2022-01-13 13:01:29 -08:00
|
|
|
if err := tlsConn.HandshakeContext(handshakeCtx); err != nil {
|
2021-02-26 12:49:54 -08:00
|
|
|
tcpConn.Close()
|
|
|
|
// TODO: if err != errTLSHandshakeTimeout,
|
|
|
|
// assume it might be some captive portal or
|
|
|
|
// otherwise incorrect DNS and try the backup
|
|
|
|
// DNS mechanism.
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return tlsConn, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// cloneTLSConfig returns a copy of cfg that the caller may modify freely.
// A nil cfg yields a new, empty *tls.Config rather than nil.
func cloneTLSConfig(cfg *tls.Config) *tls.Config {
	if cfg != nil {
		return cfg.Clone()
	}
	return &tls.Config{}
}
|