2023-01-27 13:37:20 -08:00
|
|
|
// Copyright (c) Tailscale Inc & AUTHORS
|
|
|
|
// SPDX-License-Identifier: BSD-3-Clause
|
2023-01-18 11:41:58 -05:00
|
|
|
|
2023-02-14 17:57:02 -08:00
|
|
|
// testwrapper is a wrapper for retrying flaky tests. It is an alternative to
|
|
|
|
// `go test` and re-runs failed marked flaky tests (using the flakytest pkg). It
|
|
|
|
// takes different arguments than go test and requires the first positional
|
|
|
|
// argument to be the pattern to test.
|
2023-01-18 11:41:58 -05:00
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
2023-09-07 17:18:26 +01:00
|
|
|
"bufio"
|
2023-02-14 17:57:02 -08:00
|
|
|
"bytes"
|
2023-01-18 11:41:58 -05:00
|
|
|
"context"
|
2023-02-14 17:57:02 -08:00
|
|
|
"encoding/json"
|
2023-01-18 11:41:58 -05:00
|
|
|
"errors"
|
2023-02-14 17:57:02 -08:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2023-01-18 11:41:58 -05:00
|
|
|
"log"
|
|
|
|
"os"
|
|
|
|
"os/exec"
|
2023-10-03 19:12:37 -07:00
|
|
|
"slices"
|
2023-02-14 17:57:02 -08:00
|
|
|
"sort"
|
|
|
|
"strings"
|
|
|
|
"time"
|
2023-01-18 11:41:58 -05:00
|
|
|
|
2023-08-17 09:40:19 -07:00
|
|
|
xmaps "golang.org/x/exp/maps"
|
2023-02-14 17:57:02 -08:00
|
|
|
"tailscale.com/cmd/testwrapper/flakytest"
|
2023-01-18 11:41:58 -05:00
|
|
|
)
|
|
|
|
|
2023-02-14 17:57:02 -08:00
|
|
|
const maxAttempts = 3
|
|
|
|
|
|
|
|
type testAttempt struct {
|
2023-09-04 14:56:08 -07:00
|
|
|
pkg string // "tailscale.com/types/key"
|
|
|
|
testName string // "TestFoo"
|
2023-02-14 17:57:02 -08:00
|
|
|
outcome string // "pass", "fail", "skip"
|
|
|
|
logs bytes.Buffer
|
2023-09-28 16:30:12 -07:00
|
|
|
isMarkedFlaky bool // set if the test is marked as flaky
|
|
|
|
issueURL string // set if the test is marked as flaky
|
2023-06-30 12:21:52 -07:00
|
|
|
|
|
|
|
pkgFinished bool
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
|
2023-09-28 16:30:12 -07:00
|
|
|
// packageTests describes what to run.
|
|
|
|
// It's also JSON-marshalled to output for analysys tools to parse
|
|
|
|
// so the fields are all exported.
|
|
|
|
// TODO(bradfitz): move this type to its own types package?
|
2023-02-14 17:57:02 -08:00
|
|
|
type packageTests struct {
|
2023-09-28 14:08:56 -07:00
|
|
|
// Pattern is the package Pattern to run.
|
|
|
|
// Must be a single Pattern, not a list of patterns.
|
|
|
|
Pattern string // "./...", "./types/key"
|
|
|
|
// Tests is a list of Tests to run. If empty, all Tests in the package are
|
2023-02-14 17:57:02 -08:00
|
|
|
// run.
|
2023-09-28 14:08:56 -07:00
|
|
|
Tests []string // ["TestFoo", "TestBar"]
|
2023-09-28 16:30:12 -07:00
|
|
|
// IssueURLs maps from a test name to a URL tracking its flake.
|
|
|
|
IssueURLs map[string]string // "TestFoo" => "https://github.com/foo/bar/issue/123"
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
type goTestOutput struct {
|
|
|
|
Time time.Time
|
|
|
|
Action string
|
|
|
|
Package string
|
|
|
|
Test string
|
|
|
|
Output string
|
|
|
|
}
|
|
|
|
|
|
|
|
var debug = os.Getenv("TS_TESTWRAPPER_DEBUG") != ""
|
2023-01-18 11:41:58 -05:00
|
|
|
|
2023-06-30 12:21:52 -07:00
|
|
|
// runTests runs the tests in pt and sends the results on ch. It sends a
|
|
|
|
// testAttempt for each test and a final testAttempt per pkg with pkgFinished
|
2023-09-07 17:18:26 +01:00
|
|
|
// set to true. Package build errors will not emit a testAttempt (as no valid
|
|
|
|
// JSON is produced) but the [os/exec.ExitError] will be returned.
|
2023-06-30 12:21:52 -07:00
|
|
|
// It calls close(ch) when it's done.
|
2023-10-14 16:56:08 -07:00
|
|
|
func runTests(ctx context.Context, attempt int, pt *packageTests, goTestArgs, testArgs []string, ch chan<- *testAttempt) error {
|
2023-06-30 12:21:52 -07:00
|
|
|
defer close(ch)
|
2023-10-14 16:56:08 -07:00
|
|
|
args := []string{"test"}
|
|
|
|
args = append(args, goTestArgs...)
|
2023-10-13 12:29:28 -07:00
|
|
|
args = append(args, pt.Pattern)
|
2023-09-28 14:08:56 -07:00
|
|
|
if len(pt.Tests) > 0 {
|
|
|
|
runArg := strings.Join(pt.Tests, "|")
|
2023-10-13 12:29:28 -07:00
|
|
|
args = append(args, "--run", runArg)
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
2023-10-14 16:56:08 -07:00
|
|
|
args = append(args, testArgs...)
|
|
|
|
args = append(args, "-json")
|
2023-02-14 17:57:02 -08:00
|
|
|
if debug {
|
|
|
|
fmt.Println("running", strings.Join(args, " "))
|
|
|
|
}
|
|
|
|
cmd := exec.CommandContext(ctx, "go", args...)
|
2023-10-16 18:47:03 -07:00
|
|
|
if len(pt.Tests) > 0 {
|
|
|
|
cmd.Env = append(os.Environ(), "TS_TEST_SHARD=") // clear test shard; run all tests we say to run
|
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
r, err := cmd.StdoutPipe()
|
|
|
|
if err != nil {
|
|
|
|
log.Printf("error creating stdout pipe: %v", err)
|
|
|
|
}
|
2023-07-02 09:01:53 -07:00
|
|
|
defer r.Close()
|
2023-02-14 17:57:02 -08:00
|
|
|
cmd.Stderr = os.Stderr
|
|
|
|
|
|
|
|
cmd.Env = os.Environ()
|
|
|
|
cmd.Env = append(cmd.Env, fmt.Sprintf("%s=%d", flakytest.FlakeAttemptEnv, attempt))
|
2023-01-18 11:41:58 -05:00
|
|
|
|
2023-02-14 17:57:02 -08:00
|
|
|
if err := cmd.Start(); err != nil {
|
|
|
|
log.Printf("error starting test: %v", err)
|
|
|
|
os.Exit(1)
|
|
|
|
}
|
|
|
|
|
2023-09-07 17:18:26 +01:00
|
|
|
s := bufio.NewScanner(r)
|
2023-09-04 14:56:08 -07:00
|
|
|
resultMap := make(map[string]map[string]*testAttempt) // pkg -> test -> testAttempt
|
2023-09-07 17:18:26 +01:00
|
|
|
for s.Scan() {
|
2023-02-14 17:57:02 -08:00
|
|
|
var goOutput goTestOutput
|
2023-09-07 17:18:26 +01:00
|
|
|
if err := json.Unmarshal(s.Bytes(), &goOutput); err != nil {
|
2023-02-14 17:57:02 -08:00
|
|
|
if errors.Is(err, io.EOF) || errors.Is(err, os.ErrClosed) {
|
|
|
|
break
|
|
|
|
}
|
2023-07-02 09:01:53 -07:00
|
|
|
|
|
|
|
// `go test -json` outputs invalid JSON when a build fails.
|
|
|
|
// In that case, discard the the output and start reading again.
|
|
|
|
// The build error will be printed to stderr.
|
|
|
|
// See: https://github.com/golang/go/issues/35169
|
|
|
|
if _, ok := err.(*json.SyntaxError); ok {
|
2023-09-07 17:18:26 +01:00
|
|
|
fmt.Println(s.Text())
|
2023-07-02 09:01:53 -07:00
|
|
|
continue
|
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
panic(err)
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
2023-09-04 14:56:08 -07:00
|
|
|
pkg := goOutput.Package
|
|
|
|
pkgTests := resultMap[pkg]
|
2023-02-14 17:57:02 -08:00
|
|
|
if goOutput.Test == "" {
|
2023-06-30 12:21:52 -07:00
|
|
|
switch goOutput.Action {
|
|
|
|
case "fail", "pass", "skip":
|
2023-09-04 14:56:08 -07:00
|
|
|
for _, test := range pkgTests {
|
|
|
|
if test.outcome == "" {
|
|
|
|
test.outcome = "fail"
|
|
|
|
ch <- test
|
|
|
|
}
|
|
|
|
}
|
2023-06-30 12:21:52 -07:00
|
|
|
ch <- &testAttempt{
|
2023-09-04 14:56:08 -07:00
|
|
|
pkg: goOutput.Package,
|
2023-06-30 12:21:52 -07:00
|
|
|
outcome: goOutput.Action,
|
|
|
|
pkgFinished: true,
|
|
|
|
}
|
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
continue
|
|
|
|
}
|
2023-09-04 14:56:08 -07:00
|
|
|
if pkgTests == nil {
|
|
|
|
pkgTests = make(map[string]*testAttempt)
|
|
|
|
resultMap[pkg] = pkgTests
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-09-04 14:56:08 -07:00
|
|
|
testName := goOutput.Test
|
2023-02-14 17:57:02 -08:00
|
|
|
if test, _, isSubtest := strings.Cut(goOutput.Test, "/"); isSubtest {
|
2023-09-04 14:56:08 -07:00
|
|
|
testName = test
|
2023-02-14 17:57:02 -08:00
|
|
|
if goOutput.Action == "output" {
|
2023-09-04 14:56:08 -07:00
|
|
|
resultMap[pkg][testName].logs.WriteString(goOutput.Output)
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
switch goOutput.Action {
|
|
|
|
case "start":
|
|
|
|
// ignore
|
|
|
|
case "run":
|
2023-09-04 14:56:08 -07:00
|
|
|
pkgTests[testName] = &testAttempt{
|
|
|
|
pkg: pkg,
|
|
|
|
testName: testName,
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
case "skip", "pass", "fail":
|
2023-09-04 14:56:08 -07:00
|
|
|
pkgTests[testName].outcome = goOutput.Action
|
|
|
|
ch <- pkgTests[testName]
|
2023-02-14 17:57:02 -08:00
|
|
|
case "output":
|
2023-09-28 16:30:12 -07:00
|
|
|
if suffix, ok := strings.CutPrefix(strings.TrimSpace(goOutput.Output), flakytest.FlakyTestLogMessage); ok {
|
2023-09-04 14:56:08 -07:00
|
|
|
pkgTests[testName].isMarkedFlaky = true
|
2023-09-28 16:30:12 -07:00
|
|
|
pkgTests[testName].issueURL = strings.TrimPrefix(suffix, ": ")
|
2023-02-14 17:57:02 -08:00
|
|
|
} else {
|
2023-09-04 14:56:08 -07:00
|
|
|
pkgTests[testName].logs.WriteString(goOutput.Output)
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-09-11 19:06:11 +01:00
|
|
|
if err := cmd.Wait(); err != nil {
|
2023-09-07 17:18:26 +01:00
|
|
|
return err
|
|
|
|
}
|
2023-09-11 19:06:11 +01:00
|
|
|
if err := s.Err(); err != nil {
|
|
|
|
return fmt.Errorf("reading go test stdout: %w", err)
|
|
|
|
}
|
|
|
|
return nil
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
func main() {
|
2023-10-14 16:56:08 -07:00
|
|
|
goTestArgs, packages, testArgs, err := splitArgs(os.Args[1:])
|
|
|
|
if err != nil {
|
|
|
|
log.Fatal(err)
|
|
|
|
return
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-10-14 16:56:08 -07:00
|
|
|
if len(packages) == 0 {
|
|
|
|
fmt.Println("testwrapper: no packages specified")
|
|
|
|
return
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
|
|
|
|
2023-10-14 16:56:08 -07:00
|
|
|
ctx := context.Background()
|
2023-06-30 09:31:07 -07:00
|
|
|
type nextRun struct {
|
|
|
|
tests []*packageTests
|
2023-09-28 14:08:56 -07:00
|
|
|
attempt int // starting at 1
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-10-14 16:56:08 -07:00
|
|
|
firstRun := &nextRun{
|
|
|
|
attempt: 1,
|
|
|
|
}
|
|
|
|
for _, pkg := range packages {
|
|
|
|
firstRun.tests = append(firstRun.tests, &packageTests{Pattern: pkg})
|
2023-06-30 09:31:07 -07:00
|
|
|
}
|
2023-10-14 16:56:08 -07:00
|
|
|
toRun := []*nextRun{firstRun}
|
2023-06-30 12:21:52 -07:00
|
|
|
printPkgOutcome := func(pkg, outcome string, attempt int) {
|
|
|
|
if outcome == "skip" {
|
|
|
|
fmt.Printf("?\t%s [skipped/no tests] \n", pkg)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if outcome == "pass" {
|
|
|
|
outcome = "ok"
|
2023-06-30 09:31:07 -07:00
|
|
|
}
|
2023-06-30 12:21:52 -07:00
|
|
|
if outcome == "fail" {
|
|
|
|
outcome = "FAIL"
|
|
|
|
}
|
|
|
|
if attempt > 1 {
|
|
|
|
fmt.Printf("%s\t%s [attempt=%d]\n", outcome, pkg, attempt)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
fmt.Printf("%s\t%s\n", outcome, pkg)
|
2023-06-30 09:31:07 -07:00
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
|
|
|
|
for len(toRun) > 0 {
|
2023-06-30 09:31:07 -07:00
|
|
|
var thisRun *nextRun
|
|
|
|
thisRun, toRun = toRun[0], toRun[1:]
|
2023-02-14 17:57:02 -08:00
|
|
|
|
2023-08-24 16:48:22 -04:00
|
|
|
if thisRun.attempt > maxAttempts {
|
2023-06-30 09:31:07 -07:00
|
|
|
fmt.Println("max attempts reached")
|
|
|
|
os.Exit(1)
|
|
|
|
}
|
|
|
|
if thisRun.attempt > 1 {
|
2023-09-28 14:08:56 -07:00
|
|
|
j, _ := json.Marshal(thisRun.tests)
|
2023-09-28 16:30:12 -07:00
|
|
|
fmt.Printf("\n\nAttempt #%d: Retrying flaky tests:\n\nflakytest failures JSON: %s\n\n", thisRun.attempt, j)
|
2023-06-30 09:31:07 -07:00
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
|
2023-09-28 16:30:12 -07:00
|
|
|
toRetry := make(map[string][]*testAttempt) // pkg -> tests to retry
|
2023-06-30 09:31:07 -07:00
|
|
|
for _, pt := range thisRun.tests {
|
2023-06-30 12:21:52 -07:00
|
|
|
ch := make(chan *testAttempt)
|
2023-09-07 17:18:26 +01:00
|
|
|
runErr := make(chan error, 1)
|
|
|
|
go func() {
|
|
|
|
defer close(runErr)
|
2023-10-14 16:56:08 -07:00
|
|
|
runErr <- runTests(ctx, thisRun.attempt, pt, goTestArgs, testArgs, ch)
|
2023-09-07 17:18:26 +01:00
|
|
|
}()
|
|
|
|
|
|
|
|
var failed bool
|
2023-06-30 12:21:52 -07:00
|
|
|
for tr := range ch {
|
2023-09-07 17:18:26 +01:00
|
|
|
// Go assigns the package name "command-line-arguments" when you
|
|
|
|
// `go test FILE` rather than `go test PKG`. It's more
|
|
|
|
// convenient for us to to specify files in tests, so fix tr.pkg
|
|
|
|
// so that subsequent testwrapper attempts run correctly.
|
|
|
|
if tr.pkg == "command-line-arguments" {
|
2023-10-14 16:56:08 -07:00
|
|
|
tr.pkg = packages[0]
|
2023-09-07 17:18:26 +01:00
|
|
|
}
|
2023-06-30 12:21:52 -07:00
|
|
|
if tr.pkgFinished {
|
2023-09-04 14:56:08 -07:00
|
|
|
if tr.outcome == "fail" && len(toRetry[tr.pkg]) == 0 {
|
2023-08-29 18:03:13 -07:00
|
|
|
// If a package fails and we don't have any tests to
|
|
|
|
// retry, then we should fail. This typically happens
|
|
|
|
// when a package times out.
|
|
|
|
failed = true
|
|
|
|
}
|
2023-09-04 14:56:08 -07:00
|
|
|
printPkgOutcome(tr.pkg, tr.outcome, thisRun.attempt)
|
2023-06-30 12:21:52 -07:00
|
|
|
continue
|
2023-06-30 09:31:07 -07:00
|
|
|
}
|
2023-10-14 16:56:08 -07:00
|
|
|
if testingVerbose || tr.outcome == "fail" {
|
2023-06-30 09:31:07 -07:00
|
|
|
io.Copy(os.Stdout, &tr.logs)
|
|
|
|
}
|
|
|
|
if tr.outcome != "fail" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if tr.isMarkedFlaky {
|
2023-09-28 16:30:12 -07:00
|
|
|
toRetry[tr.pkg] = append(toRetry[tr.pkg], tr)
|
2023-06-30 09:31:07 -07:00
|
|
|
} else {
|
|
|
|
failed = true
|
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
}
|
2023-09-07 17:18:26 +01:00
|
|
|
if failed {
|
|
|
|
fmt.Println("\n\nNot retrying flaky tests because non-flaky tests failed.")
|
|
|
|
os.Exit(1)
|
|
|
|
}
|
|
|
|
|
|
|
|
// If there's nothing to retry and no non-retryable tests have
|
|
|
|
// failed then we've probably hit a build error.
|
|
|
|
if err := <-runErr; len(toRetry) == 0 && err != nil {
|
|
|
|
var exit *exec.ExitError
|
|
|
|
if errors.As(err, &exit) {
|
|
|
|
if code := exit.ExitCode(); code > -1 {
|
|
|
|
os.Exit(exit.ExitCode())
|
|
|
|
}
|
|
|
|
}
|
2023-09-11 19:06:11 +01:00
|
|
|
log.Printf("testwrapper: %s", err)
|
|
|
|
os.Exit(1)
|
2023-09-07 17:18:26 +01:00
|
|
|
}
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
2023-06-30 09:31:07 -07:00
|
|
|
if len(toRetry) == 0 {
|
|
|
|
continue
|
|
|
|
}
|
2023-08-17 09:40:19 -07:00
|
|
|
pkgs := xmaps.Keys(toRetry)
|
2023-02-14 17:57:02 -08:00
|
|
|
sort.Strings(pkgs)
|
2023-06-30 09:31:07 -07:00
|
|
|
nextRun := &nextRun{
|
|
|
|
attempt: thisRun.attempt + 1,
|
|
|
|
}
|
2023-02-14 17:57:02 -08:00
|
|
|
for _, pkg := range pkgs {
|
|
|
|
tests := toRetry[pkg]
|
2023-09-28 16:30:12 -07:00
|
|
|
slices.SortFunc(tests, func(a, b *testAttempt) int { return strings.Compare(a.testName, b.testName) })
|
|
|
|
issueURLs := map[string]string{} // test name => URL
|
|
|
|
var testNames []string
|
|
|
|
for _, ta := range tests {
|
|
|
|
issueURLs[ta.testName] = ta.issueURL
|
|
|
|
testNames = append(testNames, ta.testName)
|
|
|
|
}
|
2023-06-30 09:31:07 -07:00
|
|
|
nextRun.tests = append(nextRun.tests, &packageTests{
|
2023-09-28 16:30:12 -07:00
|
|
|
Pattern: pkg,
|
|
|
|
Tests: testNames,
|
|
|
|
IssueURLs: issueURLs,
|
2023-02-14 17:57:02 -08:00
|
|
|
})
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
2023-06-30 09:31:07 -07:00
|
|
|
toRun = append(toRun, nextRun)
|
2023-01-18 11:41:58 -05:00
|
|
|
}
|
|
|
|
}
|