2020-02-05 14:16:58 -08:00
|
|
|
// Copyright (c) 2020 Tailscale Inc & AUTHORS All rights reserved.
|
|
|
|
// Use of this source code is governed by a BSD-style
|
|
|
|
// license that can be found in the LICENSE file.
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// Package filter contains a stateful packet filter.
|
2020-02-05 14:16:58 -08:00
|
|
|
package filter
|
|
|
|
|
|
|
|
import (
|
|
|
|
"sync"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/golang/groupcache/lru"
|
2020-05-08 12:30:22 -06:00
|
|
|
"golang.org/x/time/rate"
|
Add tstest.PanicOnLog(), and fix various problems detected by this.
If a test calls log.Printf, 'go test' horrifyingly rearranges the
output to no longer be in chronological order, which makes debugging
virtually impossible. Let's stop that from happening by making
log.Printf panic if called from any module, no matter how deep, during
tests.
This required us to change the default error handler in at least one
http.Server, as well as plumbing a bunch of logf functions around,
especially in magicsock and wgengine, but also in logtail and backoff.
To add insult to injury, 'go test' also rearranges the output when a
parent test has multiple sub-tests (all the sub-test's t.Logf is always
printed after all the parent tests t.Logf), so we need to screw around
with a special Logf that can point at the "current" t (current_t.Logf)
in some places. Probably our entire way of using subtests is wrong,
since 'go test' would probably like to run them all in parallel if you
called t.Parallel(), but it definitely can't because they're all
manipulating the shared state created by the parent test. They should
probably all be separate toplevel tests instead, with common
setup/teardown logic. But that's a job for another time.
Signed-off-by: Avery Pennarun <apenwarr@tailscale.com>
2020-05-13 22:59:54 -04:00
|
|
|
"tailscale.com/types/logger"
|
2020-02-05 14:16:58 -08:00
|
|
|
"tailscale.com/wgengine/packet"
|
|
|
|
)
|
|
|
|
|
2020-03-25 03:47:55 -04:00
|
|
|
type filterState struct {
|
|
|
|
mu sync.Mutex
|
2020-03-25 08:40:36 -07:00
|
|
|
lru *lru.Cache // of tuple
|
2020-03-25 03:47:55 -04:00
|
|
|
}
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// Filter is a stateful packet filter.
|
2020-02-05 14:16:58 -08:00
|
|
|
type Filter struct {
|
2020-05-22 02:41:18 +00:00
|
|
|
logf logger.Logf
|
|
|
|
// localNets is the list of IP prefixes that we know to be "local"
|
|
|
|
// to this node. All packets coming in over tailscale must have a
|
|
|
|
// destination within localNets, regardless of the policy filter
|
|
|
|
// below. A nil localNets rejects all incoming traffic.
|
|
|
|
localNets []Net
|
|
|
|
// matches is a list of match->action rules applied to all packets
|
|
|
|
// arriving over tailscale tunnels. Matches are checked in order,
|
|
|
|
// and processing stops at the first matching rule. The default
|
|
|
|
// policy if no rules match is to drop the packet.
|
2020-02-05 14:16:58 -08:00
|
|
|
matches Matches
|
2020-05-22 02:41:18 +00:00
|
|
|
// state is the connection tracking state attached to this
|
|
|
|
// filter. It is used to allow incoming traffic that is a response
|
|
|
|
// to an outbound connection that this node made, even if those
|
|
|
|
// incoming packets don't get accepted by matches above.
|
|
|
|
state *filterState
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// Response is the verdict a filter stage reaches for a packet: Drop,
// Accept, or noVerdict, the last meaning "keep processing".
type Response int
|
|
|
|
|
|
|
|
const (
|
|
|
|
Drop Response = iota
|
|
|
|
Accept
|
|
|
|
noVerdict // Returned from subfilters to continue processing.
|
|
|
|
)
|
|
|
|
|
|
|
|
func (r Response) String() string {
|
|
|
|
switch r {
|
|
|
|
case Drop:
|
|
|
|
return "Drop"
|
|
|
|
case Accept:
|
|
|
|
return "Accept"
|
|
|
|
case noVerdict:
|
|
|
|
return "noVerdict"
|
|
|
|
default:
|
|
|
|
return "???"
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// RunFlags is a bit set that selects, per call, how verbosely the
// filter logs its decisions for debugging.
type RunFlags int
|
|
|
|
|
|
|
|
const (
|
|
|
|
LogDrops RunFlags = 1 << iota
|
|
|
|
LogAccepts
|
|
|
|
HexdumpDrops
|
|
|
|
HexdumpAccepts
|
|
|
|
)
|
|
|
|
|
|
|
|
type tuple struct {
|
2020-05-11 07:19:17 -07:00
|
|
|
SrcIP packet.IP
|
|
|
|
DstIP packet.IP
|
2020-02-05 14:16:58 -08:00
|
|
|
SrcPort uint16
|
|
|
|
DstPort uint16
|
|
|
|
}
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// lruMax is the maximum number of entries kept in the UDP LRU cache.
const lruMax = 512
|
2020-02-05 14:16:58 -08:00
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// MatchAllowAll matches all packets.
|
2020-02-05 14:16:58 -08:00
|
|
|
var MatchAllowAll = Matches{
|
2020-04-30 01:49:17 -04:00
|
|
|
Match{[]NetPortRange{NetPortRangeAny}, []Net{NetAny}},
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
|
2020-05-22 02:41:18 +00:00
|
|
|
// NewAllowAll returns a packet filter that accepts everything to and
|
|
|
|
// from localNets.
|
|
|
|
func NewAllowAll(localNets []Net, logf logger.Logf) *Filter {
|
|
|
|
return New(MatchAllowAll, localNets, nil, logf)
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
|
2020-03-25 08:40:36 -07:00
|
|
|
// NewAllowNone returns a packet filter that rejects everything.
|
Add tstest.PanicOnLog(), and fix various problems detected by this.
If a test calls log.Printf, 'go test' horrifyingly rearranges the
output to no longer be in chronological order, which makes debugging
virtually impossible. Let's stop that from happening by making
log.Printf panic if called from any module, no matter how deep, during
tests.
This required us to change the default error handler in at least one
http.Server, as well as plumbing a bunch of logf functions around,
especially in magicsock and wgengine, but also in logtail and backoff.
To add insult to injury, 'go test' also rearranges the output when a
parent test has multiple sub-tests (all the sub-test's t.Logf is always
printed after all the parent tests t.Logf), so we need to screw around
with a special Logf that can point at the "current" t (current_t.Logf)
in some places. Probably our entire way of using subtests is wrong,
since 'go test' would probably like to run them all in parallel if you
called t.Parallel(), but it definitely can't because the're all
manipulating the shared state created by the parent test. They should
probably all be separate toplevel tests instead, with common
setup/teardown logic. But that's a job for another time.
Signed-off-by: Avery Pennarun <apenwarr@tailscale.com>
2020-05-13 22:59:54 -04:00
|
|
|
func NewAllowNone(logf logger.Logf) *Filter {
|
2020-05-22 02:41:18 +00:00
|
|
|
return New(nil, nil, nil, logf)
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
|
2020-05-22 02:41:18 +00:00
|
|
|
// New creates a new packet filter. The filter enforces that incoming
|
|
|
|
// packets must be destined to an IP in localNets, and must be allowed
|
|
|
|
// by matches. If shareStateWith is non-nil, the returned filter
|
|
|
|
// shares state with the previous one, to enable rules to be changed
|
|
|
|
// at runtime without breaking existing flows.
|
|
|
|
func New(matches Matches, localNets []Net, shareStateWith *Filter, logf logger.Logf) *Filter {
|
2020-03-25 03:47:55 -04:00
|
|
|
var state *filterState
|
|
|
|
if shareStateWith != nil {
|
|
|
|
state = shareStateWith.state
|
|
|
|
} else {
|
|
|
|
state = &filterState{
|
2020-03-25 08:40:36 -07:00
|
|
|
lru: lru.New(lruMax),
|
2020-03-25 03:47:55 -04:00
|
|
|
}
|
|
|
|
}
|
2020-02-05 14:16:58 -08:00
|
|
|
f := &Filter{
|
2020-05-22 02:41:18 +00:00
|
|
|
logf: logf,
|
|
|
|
matches: matches,
|
|
|
|
localNets: localNets,
|
|
|
|
state: state,
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
return f
|
|
|
|
}
|
|
|
|
|
|
|
|
func maybeHexdump(flag RunFlags, b []byte) string {
|
2020-05-08 12:30:22 -06:00
|
|
|
if flag == 0 {
|
2020-02-05 14:16:58 -08:00
|
|
|
return ""
|
|
|
|
}
|
2020-05-08 12:30:22 -06:00
|
|
|
return packet.Hexdump(b) + "\n"
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// TODO(apenwarr): use a bigger bucket for specifically TCP SYN accept logging?
|
|
|
|
// Logging is a quick way to record every newly opened TCP connection, but
|
|
|
|
// we have to be cautious about flooding the logs vs letting people use
|
|
|
|
// flood protection to hide their traffic. We could use a rate limiter in
|
|
|
|
// the actual *filter* for SYN accepts, perhaps.
|
2020-05-08 12:30:22 -06:00
|
|
|
var acceptBucket = rate.NewLimiter(rate.Every(10*time.Second), 3)
|
|
|
|
var dropBucket = rate.NewLimiter(rate.Every(5*time.Second), 10)
|
2020-02-05 14:16:58 -08:00
|
|
|
|
2020-06-08 18:19:26 -04:00
|
|
|
func (f *Filter) logRateLimit(runflags RunFlags, q *packet.ParsedPacket, r Response, why string) {
|
2020-06-02 08:09:20 -04:00
|
|
|
var verdict string
|
|
|
|
|
2020-05-08 12:30:22 -06:00
|
|
|
if r == Drop && (runflags&LogDrops) != 0 && dropBucket.Allow() {
|
2020-06-02 08:09:20 -04:00
|
|
|
verdict = "Drop"
|
|
|
|
runflags &= HexdumpDrops
|
|
|
|
} else if r == Accept && (runflags&LogAccepts) != 0 && acceptBucket.Allow() {
|
|
|
|
verdict = "Accept"
|
|
|
|
runflags &= HexdumpAccepts
|
|
|
|
}
|
|
|
|
|
|
|
|
// Note: it is crucial that q.String() be called only if {accept,drop}Bucket.Allow() passes,
|
|
|
|
// since it causes an allocation.
|
|
|
|
if verdict != "" {
|
2020-06-08 18:19:26 -04:00
|
|
|
b := q.Buffer()
|
|
|
|
f.logf("%s: %s %d %s\n%s", verdict, q.String(), len(b), why, maybeHexdump(runflags, b))
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-08 18:19:26 -04:00
|
|
|
// RunIn determines whether this node is allowed to receive q from a Tailscale peer.
|
|
|
|
func (f *Filter) RunIn(q *packet.ParsedPacket, rf RunFlags) Response {
|
|
|
|
r := f.pre(q, rf)
|
2020-02-05 14:16:58 -08:00
|
|
|
if r == Accept || r == Drop {
|
|
|
|
// already logged
|
|
|
|
return r
|
|
|
|
}
|
|
|
|
|
|
|
|
r, why := f.runIn(q)
|
2020-06-08 18:19:26 -04:00
|
|
|
f.logRateLimit(rf, q, r, why)
|
2020-02-05 14:16:58 -08:00
|
|
|
return r
|
|
|
|
}
|
|
|
|
|
2020-06-08 18:19:26 -04:00
|
|
|
// RunOut determines whether this node is allowed to send q to a Tailscale peer.
|
|
|
|
func (f *Filter) RunOut(q *packet.ParsedPacket, rf RunFlags) Response {
|
|
|
|
r := f.pre(q, rf)
|
2020-02-05 14:16:58 -08:00
|
|
|
if r == Drop || r == Accept {
|
|
|
|
// already logged
|
|
|
|
return r
|
|
|
|
}
|
|
|
|
r, why := f.runOut(q)
|
2020-06-08 18:19:26 -04:00
|
|
|
f.logRateLimit(rf, q, r, why)
|
2020-02-05 14:16:58 -08:00
|
|
|
return r
|
|
|
|
}
|
|
|
|
|
2020-06-04 18:42:44 -04:00
|
|
|
func (f *Filter) runIn(q *packet.ParsedPacket) (r Response, why string) {
|
2020-05-22 02:41:18 +00:00
|
|
|
// A compromised peer could try to send us packets for
|
|
|
|
// destinations we didn't explicitly advertise. This check is to
|
|
|
|
// prevent that.
|
|
|
|
if !ipInList(q.DstIP, f.localNets) {
|
|
|
|
return Drop, "destination not allowed"
|
|
|
|
}
|
|
|
|
|
2020-02-05 14:16:58 -08:00
|
|
|
switch q.IPProto {
|
|
|
|
case packet.ICMP:
|
2020-04-29 03:53:32 -04:00
|
|
|
if q.IsEchoResponse() || q.IsError() {
|
|
|
|
// ICMP responses are allowed.
|
|
|
|
// TODO(apenwarr): consider using conntrack state.
|
|
|
|
// We could choose to reject all packets that aren't
|
|
|
|
// related to an existing ICMP-Echo, TCP, or UDP
|
|
|
|
// session.
|
|
|
|
return Accept, "icmp response ok"
|
|
|
|
} else if matchIPWithoutPorts(f.matches, q) {
|
|
|
|
// If any port is open to an IP, allow ICMP to it.
|
2020-02-05 14:16:58 -08:00
|
|
|
return Accept, "icmp ok"
|
|
|
|
}
|
|
|
|
case packet.TCP:
|
|
|
|
// For TCP, we want to allow *outgoing* connections,
|
|
|
|
// which means we want to allow return packets on those
|
|
|
|
// connections. To make this restriction work, we need to
|
|
|
|
// allow non-SYN packets (continuation of an existing session)
|
|
|
|
// to arrive. This should be okay since a new incoming session
|
|
|
|
// can't be initiated without first sending a SYN.
|
|
|
|
// It happens to also be much faster.
|
|
|
|
// TODO(apenwarr): Skip the rest of decoding in this path?
|
|
|
|
if q.IPProto == packet.TCP && !q.IsTCPSyn() {
|
|
|
|
return Accept, "tcp non-syn"
|
|
|
|
}
|
|
|
|
if matchIPPorts(f.matches, q) {
|
|
|
|
return Accept, "tcp ok"
|
|
|
|
}
|
|
|
|
case packet.UDP:
|
|
|
|
t := tuple{q.SrcIP, q.DstIP, q.SrcPort, q.DstPort}
|
|
|
|
|
2020-03-25 03:47:55 -04:00
|
|
|
f.state.mu.Lock()
|
|
|
|
_, ok := f.state.lru.Get(t)
|
|
|
|
f.state.mu.Unlock()
|
2020-02-05 14:16:58 -08:00
|
|
|
|
|
|
|
if ok {
|
|
|
|
return Accept, "udp cached"
|
|
|
|
}
|
|
|
|
if matchIPPorts(f.matches, q) {
|
|
|
|
return Accept, "udp ok"
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
return Drop, "Unknown proto"
|
|
|
|
}
|
|
|
|
return Drop, "no rules matched"
|
|
|
|
}
|
|
|
|
|
2020-06-04 18:42:44 -04:00
|
|
|
func (f *Filter) runOut(q *packet.ParsedPacket) (r Response, why string) {
|
2020-02-05 14:16:58 -08:00
|
|
|
if q.IPProto == packet.UDP {
|
|
|
|
t := tuple{q.DstIP, q.SrcIP, q.DstPort, q.SrcPort}
|
2020-03-25 08:40:36 -07:00
|
|
|
var ti interface{} = t // allocate once, rather than twice inside mutex
|
2020-02-05 14:16:58 -08:00
|
|
|
|
2020-03-25 03:47:55 -04:00
|
|
|
f.state.mu.Lock()
|
2020-03-25 08:40:36 -07:00
|
|
|
f.state.lru.Add(ti, ti)
|
2020-03-25 03:47:55 -04:00
|
|
|
f.state.mu.Unlock()
|
2020-02-05 14:16:58 -08:00
|
|
|
}
|
|
|
|
return Accept, "ok out"
|
|
|
|
}
|
|
|
|
|
2020-06-08 18:19:26 -04:00
|
|
|
func (f *Filter) pre(q *packet.ParsedPacket, rf RunFlags) Response {
|
|
|
|
if len(q.Buffer()) == 0 {
|
2020-02-05 14:16:58 -08:00
|
|
|
// wireguard keepalive packet, always permit.
|
|
|
|
return Accept
|
|
|
|
}
|
2020-06-08 18:19:26 -04:00
|
|
|
if len(q.Buffer()) < 20 {
|
|
|
|
f.logRateLimit(rf, q, Drop, "too short")
|
2020-02-05 14:16:58 -08:00
|
|
|
return Drop
|
|
|
|
}
|
|
|
|
|
2020-06-04 18:42:44 -04:00
|
|
|
switch q.IPProto {
|
|
|
|
case packet.Unknown:
|
|
|
|
// Unknown packets are dangerous; always drop them.
|
2020-06-08 18:19:26 -04:00
|
|
|
f.logRateLimit(rf, q, Drop, "unknown")
|
2020-06-04 18:42:44 -04:00
|
|
|
return Drop
|
|
|
|
case packet.IPv6:
|
2020-06-08 18:19:26 -04:00
|
|
|
f.logRateLimit(rf, q, Drop, "ipv6")
|
2020-02-05 14:16:58 -08:00
|
|
|
return Drop
|
2020-06-04 18:42:44 -04:00
|
|
|
case packet.Fragment:
|
2020-02-05 14:16:58 -08:00
|
|
|
// Fragments after the first always need to be passed through.
|
2020-06-04 18:42:44 -04:00
|
|
|
// Very small fragments are considered Junk by ParsedPacket.
|
2020-06-08 18:19:26 -04:00
|
|
|
f.logRateLimit(rf, q, Accept, "fragment")
|
2020-02-05 14:16:58 -08:00
|
|
|
return Accept
|
|
|
|
}
|
|
|
|
|
|
|
|
return noVerdict
|
|
|
|
}
|