mirror of
				https://github.com/tailscale/tailscale.git
				synced 2025-11-04 02:01:14 +01:00 
			
		
		
		
	(Continuing quest to remove rando stuff from the "Engine") Updates #cleanup Change-Id: I77f39902c2194410c10c054b545d70c9744250b0 Signed-off-by: Brad Fitzpatrick <bradfitz@tailscale.com>
		
			
				
	
	
		
			160 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			160 lines
		
	
	
		
			4.0 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
// Copyright (c) Tailscale Inc & AUTHORS
 | 
						|
// SPDX-License-Identifier: BSD-3-Clause
 | 
						|
 | 
						|
//go:build !js
 | 
						|
 | 
						|
package wgengine
 | 
						|
 | 
						|
import (
 | 
						|
	"fmt"
 | 
						|
	"log"
 | 
						|
	"net/netip"
 | 
						|
	"runtime/pprof"
 | 
						|
	"strings"
 | 
						|
	"sync"
 | 
						|
	"time"
 | 
						|
 | 
						|
	"tailscale.com/envknob"
 | 
						|
	"tailscale.com/ipn/ipnstate"
 | 
						|
	"tailscale.com/net/dns"
 | 
						|
	"tailscale.com/tailcfg"
 | 
						|
	"tailscale.com/types/netmap"
 | 
						|
	"tailscale.com/wgengine/capture"
 | 
						|
	"tailscale.com/wgengine/filter"
 | 
						|
	"tailscale.com/wgengine/router"
 | 
						|
	"tailscale.com/wgengine/wgcfg"
 | 
						|
)
 | 
						|
 | 
						|
// NewWatchdog wraps an Engine and makes sure that all methods complete
 | 
						|
// within a reasonable amount of time.
 | 
						|
//
 | 
						|
// If they do not, the watchdog crashes the process.
 | 
						|
func NewWatchdog(e Engine) Engine {
 | 
						|
	if envknob.Bool("TS_DEBUG_DISABLE_WATCHDOG") {
 | 
						|
		return e
 | 
						|
	}
 | 
						|
	return &watchdogEngine{
 | 
						|
		wrap:     e,
 | 
						|
		logf:     log.Printf,
 | 
						|
		fatalf:   log.Fatalf,
 | 
						|
		maxWait:  45 * time.Second,
 | 
						|
		inFlight: make(map[inFlightKey]time.Time),
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
type inFlightKey struct {
 | 
						|
	op  string
 | 
						|
	ctr uint64
 | 
						|
}
 | 
						|
 | 
						|
type watchdogEngine struct {
 | 
						|
	wrap    Engine
 | 
						|
	logf    func(format string, args ...any)
 | 
						|
	fatalf  func(format string, args ...any)
 | 
						|
	maxWait time.Duration
 | 
						|
 | 
						|
	// Track the start time(s) of in-flight operations
 | 
						|
	inFlightMu  sync.Mutex
 | 
						|
	inFlight    map[inFlightKey]time.Time
 | 
						|
	inFlightCtr uint64
 | 
						|
}
 | 
						|
 | 
						|
func (e *watchdogEngine) watchdogErr(name string, fn func() error) error {
 | 
						|
	// Track all in-flight operations so we can print more useful error
 | 
						|
	// messages on watchdog failure
 | 
						|
	e.inFlightMu.Lock()
 | 
						|
	key := inFlightKey{
 | 
						|
		op:  name,
 | 
						|
		ctr: e.inFlightCtr,
 | 
						|
	}
 | 
						|
	e.inFlightCtr++
 | 
						|
	e.inFlight[key] = time.Now()
 | 
						|
	e.inFlightMu.Unlock()
 | 
						|
 | 
						|
	defer func() {
 | 
						|
		e.inFlightMu.Lock()
 | 
						|
		defer e.inFlightMu.Unlock()
 | 
						|
		delete(e.inFlight, key)
 | 
						|
	}()
 | 
						|
 | 
						|
	errCh := make(chan error)
 | 
						|
	go func() {
 | 
						|
		errCh <- fn()
 | 
						|
	}()
 | 
						|
	t := time.NewTimer(e.maxWait)
 | 
						|
	select {
 | 
						|
	case err := <-errCh:
 | 
						|
		t.Stop()
 | 
						|
		return err
 | 
						|
	case <-t.C:
 | 
						|
		buf := new(strings.Builder)
 | 
						|
		pprof.Lookup("goroutine").WriteTo(buf, 1)
 | 
						|
		e.logf("wgengine watchdog stacks:\n%s", buf.String())
 | 
						|
 | 
						|
		// Collect the list of in-flight operations for debugging.
 | 
						|
		var (
 | 
						|
			b   []byte
 | 
						|
			now = time.Now()
 | 
						|
		)
 | 
						|
		e.inFlightMu.Lock()
 | 
						|
		for k, t := range e.inFlight {
 | 
						|
			dur := now.Sub(t).Round(time.Millisecond)
 | 
						|
			b = fmt.Appendf(b, "in-flight[%d]: name=%s duration=%v start=%s\n", k.ctr, k.op, dur, t.Format(time.RFC3339Nano))
 | 
						|
		}
 | 
						|
		e.inFlightMu.Unlock()
 | 
						|
 | 
						|
		// Print everything as a single string to avoid log
 | 
						|
		// rate limits.
 | 
						|
		e.logf("wgengine watchdog in-flight:\n%s", b)
 | 
						|
		e.fatalf("wgengine: watchdog timeout on %s", name)
 | 
						|
		return nil
 | 
						|
	}
 | 
						|
}
 | 
						|
 | 
						|
func (e *watchdogEngine) watchdog(name string, fn func()) {
 | 
						|
	e.watchdogErr(name, func() error {
 | 
						|
		fn()
 | 
						|
		return nil
 | 
						|
	})
 | 
						|
}
 | 
						|
 | 
						|
func (e *watchdogEngine) Reconfig(cfg *wgcfg.Config, routerCfg *router.Config, dnsCfg *dns.Config) error {
 | 
						|
	return e.watchdogErr("Reconfig", func() error { return e.wrap.Reconfig(cfg, routerCfg, dnsCfg) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) GetFilter() *filter.Filter {
 | 
						|
	return e.wrap.GetFilter()
 | 
						|
}
 | 
						|
func (e *watchdogEngine) SetFilter(filt *filter.Filter) {
 | 
						|
	e.watchdog("SetFilter", func() { e.wrap.SetFilter(filt) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) SetStatusCallback(cb StatusCallback) {
 | 
						|
	e.watchdog("SetStatusCallback", func() { e.wrap.SetStatusCallback(cb) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) UpdateStatus(sb *ipnstate.StatusBuilder) {
 | 
						|
	e.watchdog("UpdateStatus", func() { e.wrap.UpdateStatus(sb) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) RequestStatus() {
 | 
						|
	e.watchdog("RequestStatus", func() { e.wrap.RequestStatus() })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) SetNetworkMap(nm *netmap.NetworkMap) {
 | 
						|
	e.watchdog("SetNetworkMap", func() { e.wrap.SetNetworkMap(nm) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) Ping(ip netip.Addr, pingType tailcfg.PingType, size int, cb func(*ipnstate.PingResult)) {
 | 
						|
	e.watchdog("Ping", func() { e.wrap.Ping(ip, pingType, size, cb) })
 | 
						|
}
 | 
						|
func (e *watchdogEngine) Close() {
 | 
						|
	e.watchdog("Close", e.wrap.Close)
 | 
						|
}
 | 
						|
func (e *watchdogEngine) PeerForIP(ip netip.Addr) (ret PeerForIP, ok bool) {
 | 
						|
	e.watchdog("PeerForIP", func() { ret, ok = e.wrap.PeerForIP(ip) })
 | 
						|
	return ret, ok
 | 
						|
}
 | 
						|
 | 
						|
func (e *watchdogEngine) Wait() {
 | 
						|
	e.wrap.Wait()
 | 
						|
}
 | 
						|
 | 
						|
func (e *watchdogEngine) InstallCaptureHook(cb capture.Callback) {
 | 
						|
	e.wrap.InstallCaptureHook(cb)
 | 
						|
}
 |