| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
70370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761
27712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761
77717781779178017811782178317841785178617871788178917901791179217931794 |
- // Copyright (c) Tailscale Inc & AUTHORS
- // SPDX-License-Identifier: BSD-3-Clause
- package controlclient
- import (
- "bufio"
- "bytes"
- "context"
- "crypto/ed25519"
- "encoding/base64"
- "encoding/binary"
- "encoding/json"
- "errors"
- "fmt"
- "io"
- "log"
- "net/http"
- "net/http/httptest"
- "net/netip"
- "net/url"
- "os"
- "reflect"
- "runtime"
- "strings"
- "sync"
- "time"
- "go4.org/mem"
- "tailscale.com/control/controlknobs"
- "tailscale.com/envknob"
- "tailscale.com/health"
- "tailscale.com/hostinfo"
- "tailscale.com/ipn/ipnstate"
- "tailscale.com/log/logheap"
- "tailscale.com/logtail"
- "tailscale.com/net/dnscache"
- "tailscale.com/net/dnsfallback"
- "tailscale.com/net/interfaces"
- "tailscale.com/net/netmon"
- "tailscale.com/net/netutil"
- "tailscale.com/net/tlsdial"
- "tailscale.com/net/tsdial"
- "tailscale.com/net/tshttpproxy"
- "tailscale.com/syncs"
- "tailscale.com/tailcfg"
- "tailscale.com/tka"
- "tailscale.com/types/key"
- "tailscale.com/types/logger"
- "tailscale.com/types/netmap"
- "tailscale.com/types/opt"
- "tailscale.com/types/persist"
- "tailscale.com/types/tkatype"
- "tailscale.com/util/clientmetric"
- "tailscale.com/util/multierr"
- "tailscale.com/util/singleflight"
- "tailscale.com/util/systemd"
- )
- // Direct is the client that connects to a tailcontrol server for a node.
- type Direct struct {
- httpc *http.Client // HTTP client used to talk to tailcontrol
- dialer *tsdial.Dialer
- dnsCache *dnscache.Resolver
- serverURL string // URL of the tailcontrol server
- timeNow func() time.Time
- lastPrintMap time.Time
- newDecompressor func() (Decompressor, error)
- keepAlive bool
- logf logger.Logf
- netMon *netmon.Monitor // or nil
- discoPubKey key.DiscoPublic
- getMachinePrivKey func() (key.MachinePrivate, error)
- debugFlags []string
- keepSharerAndUserSplit bool
- skipIPForwardingCheck bool
- pinger Pinger
- popBrowser func(url string) // or nil
- c2nHandler http.Handler // or nil
- onClientVersion func(*tailcfg.ClientVersion) // or nil
- onControlTime func(time.Time) // or nil
- dialPlan ControlDialPlanner // can be nil
- mu sync.Mutex // mutex guards the following fields
- serverKey key.MachinePublic // original ("legacy") nacl crypto_box-based public key
- serverNoiseKey key.MachinePublic
- sfGroup singleflight.Group[struct{}, *NoiseClient] // protects noiseClient creation.
- noiseClient *NoiseClient
- persist persist.PersistView
- authKey string
- tryingNewKey key.NodePrivate
- expiry *time.Time
- hostinfo *tailcfg.Hostinfo // always non-nil
- netinfo *tailcfg.NetInfo
- endpoints []tailcfg.Endpoint
- tkaHead string
- lastPingURL string // last PingRequest.URL received, for dup suppression
- }
- type Options struct {
- Persist persist.Persist // initial persistent data
- GetMachinePrivateKey func() (key.MachinePrivate, error) // returns the machine key to use
- ServerURL string // URL of the tailcontrol server
- AuthKey string // optional node auth key for auto registration
- TimeNow func() time.Time // time.Now implementation used by Client
- Hostinfo *tailcfg.Hostinfo // non-nil passes ownership, nil means to use default using os.Hostname, etc
- DiscoPublicKey key.DiscoPublic
- NewDecompressor func() (Decompressor, error)
- KeepAlive bool
- Logf logger.Logf
- HTTPTestClient *http.Client // optional HTTP client to use (for tests only)
- NoiseTestClient *http.Client // optional HTTP client to use for noise RPCs (tests only)
- DebugFlags []string // debug settings to send to control
- NetMon *netmon.Monitor // optional network monitor
- PopBrowserURL func(url string) // optional func to open browser
- OnClientVersion func(*tailcfg.ClientVersion) // optional func to inform GUI of client version status
- OnControlTime func(time.Time) // optional func to notify callers of new time from control
- Dialer *tsdial.Dialer // non-nil
- C2NHandler http.Handler // or nil
- // Status is called when there's a change in status.
- Status func(Status)
- // KeepSharerAndUserSplit controls whether the client
- // understands Node.Sharer. If false, the Sharer is mapped to the User.
- KeepSharerAndUserSplit bool
- // SkipIPForwardingCheck declares that the host's IP
- // forwarding works and should not be double-checked by the
- // controlclient package.
- SkipIPForwardingCheck bool
- // Pinger optionally specifies the Pinger to use to satisfy
- // MapResponse.PingRequest queries from the control plane.
- // If nil, PingRequest queries are not answered.
- Pinger Pinger
- // DialPlan contains and stores a previous dial plan that we received
- // from the control server; if nil, we fall back to using DNS.
- //
- // If we receive a new DialPlan from the server, this value will be
- // updated.
- DialPlan ControlDialPlanner
- }
- // ControlDialPlanner is the interface optionally supplied when creating a
- // control client to control exactly how TCP connections to the control plane
- // are dialed.
- //
- // It is usually implemented by an atomic.Pointer.
- type ControlDialPlanner interface {
- // Load returns the current plan for how to connect to control.
- //
- // The returned plan can be nil. If so, connections should be made by
- // resolving the control URL using DNS.
- Load() *tailcfg.ControlDialPlan
- // Store updates the dial plan with new directions from the control
- // server.
- //
- // The dial plan can span multiple connections to the control server.
- // That is, a dial plan received when connected over Wi-Fi is still
- // valid for a subsequent connection over LTE after a network switch.
- Store(*tailcfg.ControlDialPlan)
- }
- // Pinger is the LocalBackend.Ping method.
- type Pinger interface {
- // Ping is a request to do a ping with the peer handling the given IP.
- Ping(ctx context.Context, ip netip.Addr, pingType tailcfg.PingType) (*ipnstate.PingResult, error)
- }
// Decompressor is the decoder type produced by the NewDecompressor
// constructor funcs carried in Options and Direct.
type Decompressor interface {
	// DecodeAll takes an input buffer and a destination buffer and
	// returns a byte slice and an error.
	DecodeAll(input, dst []byte) ([]byte, error)

	// Close takes no arguments and returns nothing.
	Close()
}
- // NewDirect returns a new Direct client.
- func NewDirect(opts Options) (*Direct, error) {
- if opts.ServerURL == "" {
- return nil, errors.New("controlclient.New: no server URL specified")
- }
- if opts.GetMachinePrivateKey == nil {
- return nil, errors.New("controlclient.New: no GetMachinePrivateKey specified")
- }
- opts.ServerURL = strings.TrimRight(opts.ServerURL, "/")
- serverURL, err := url.Parse(opts.ServerURL)
- if err != nil {
- return nil, err
- }
- if opts.TimeNow == nil {
- opts.TimeNow = time.Now
- }
- if opts.Logf == nil {
- // TODO(apenwarr): remove this default and fail instead.
- // TODO(bradfitz): ... but then it shouldn't be in Options.
- opts.Logf = log.Printf
- }
- dnsCache := &dnscache.Resolver{
- Forward: dnscache.Get().Forward, // use default cache's forwarder
- UseLastGood: true,
- LookupIPFallback: dnsfallback.MakeLookupFunc(opts.Logf, opts.NetMon),
- Logf: opts.Logf,
- NetMon: opts.NetMon,
- }
- httpc := opts.HTTPTestClient
- if httpc == nil && runtime.GOOS == "js" {
- // In js/wasm, net/http.Transport (as of Go 1.18) will
- // only use the browser's Fetch API if you're using
- // the DefaultClient (or a client without dial hooks
- // etc set).
- httpc = http.DefaultClient
- }
- if httpc == nil {
- tr := http.DefaultTransport.(*http.Transport).Clone()
- tr.Proxy = tshttpproxy.ProxyFromEnvironment
- tshttpproxy.SetTransportGetProxyConnectHeader(tr)
- tr.TLSClientConfig = tlsdial.Config(serverURL.Hostname(), tr.TLSClientConfig)
- tr.DialContext = dnscache.Dialer(opts.Dialer.SystemDial, dnsCache)
- tr.DialTLSContext = dnscache.TLSDialer(opts.Dialer.SystemDial, dnsCache, tr.TLSClientConfig)
- tr.ForceAttemptHTTP2 = true
- // Disable implicit gzip compression; the various
- // handlers (register, map, set-dns, etc) do their own
- // zstd compression per naclbox.
- tr.DisableCompression = true
- httpc = &http.Client{Transport: tr}
- }
- c := &Direct{
- httpc: httpc,
- getMachinePrivKey: opts.GetMachinePrivateKey,
- serverURL: opts.ServerURL,
- timeNow: opts.TimeNow,
- logf: opts.Logf,
- newDecompressor: opts.NewDecompressor,
- keepAlive: opts.KeepAlive,
- persist: opts.Persist.View(),
- authKey: opts.AuthKey,
- discoPubKey: opts.DiscoPublicKey,
- debugFlags: opts.DebugFlags,
- keepSharerAndUserSplit: opts.KeepSharerAndUserSplit,
- netMon: opts.NetMon,
- skipIPForwardingCheck: opts.SkipIPForwardingCheck,
- pinger: opts.Pinger,
- popBrowser: opts.PopBrowserURL,
- onClientVersion: opts.OnClientVersion,
- onControlTime: opts.OnControlTime,
- c2nHandler: opts.C2NHandler,
- dialer: opts.Dialer,
- dnsCache: dnsCache,
- dialPlan: opts.DialPlan,
- }
- if opts.Hostinfo == nil {
- c.SetHostinfo(hostinfo.New())
- } else {
- ni := opts.Hostinfo.NetInfo
- opts.Hostinfo.NetInfo = nil
- c.SetHostinfo(opts.Hostinfo)
- if ni != nil {
- c.SetNetInfo(ni)
- }
- }
- if opts.NoiseTestClient != nil {
- c.noiseClient = &NoiseClient{
- Client: opts.NoiseTestClient,
- }
- c.serverNoiseKey = key.NewMachine().Public() // prevent early error before hitting test client
- }
- return c, nil
- }
- // Close closes the underlying Noise connection(s).
- func (c *Direct) Close() error {
- c.mu.Lock()
- defer c.mu.Unlock()
- if c.noiseClient != nil {
- if err := c.noiseClient.Close(); err != nil {
- return err
- }
- }
- c.noiseClient = nil
- return nil
- }
- // SetHostinfo clones the provided Hostinfo and remembers it for the
- // next update. It reports whether the Hostinfo has changed.
- func (c *Direct) SetHostinfo(hi *tailcfg.Hostinfo) bool {
- if hi == nil {
- panic("nil Hostinfo")
- }
- c.mu.Lock()
- defer c.mu.Unlock()
- if hi.Equal(c.hostinfo) {
- return false
- }
- c.hostinfo = hi.Clone()
- j, _ := json.Marshal(c.hostinfo)
- c.logf("[v1] HostInfo: %s", j)
- return true
- }
- // SetNetInfo clones the provided NetInfo and remembers it for the
- // next update. It reports whether the NetInfo has changed.
- func (c *Direct) SetNetInfo(ni *tailcfg.NetInfo) bool {
- if ni == nil {
- panic("nil NetInfo")
- }
- c.mu.Lock()
- defer c.mu.Unlock()
- if reflect.DeepEqual(ni, c.netinfo) {
- return false
- }
- c.netinfo = ni.Clone()
- c.logf("NetInfo: %v", ni)
- return true
- }
- // SetNetInfo stores a new TKA head value for next update.
- // It reports whether the TKA head changed.
- func (c *Direct) SetTKAHead(tkaHead string) bool {
- c.mu.Lock()
- defer c.mu.Unlock()
- if tkaHead == c.tkaHead {
- return false
- }
- c.tkaHead = tkaHead
- c.logf("tkaHead: %v", tkaHead)
- return true
- }
- func (c *Direct) GetPersist() persist.PersistView {
- c.mu.Lock()
- defer c.mu.Unlock()
- return c.persist
- }
- func (c *Direct) TryLogout(ctx context.Context) error {
- c.logf("[v1] direct.TryLogout()")
- mustRegen, newURL, _, err := c.doLogin(ctx, loginOpt{Logout: true})
- c.logf("[v1] TryLogout control response: mustRegen=%v, newURL=%v, err=%v", mustRegen, newURL, err)
- c.mu.Lock()
- c.persist = new(persist.Persist).View()
- c.mu.Unlock()
- return err
- }
- func (c *Direct) TryLogin(ctx context.Context, t *tailcfg.Oauth2Token, flags LoginFlags) (url string, err error) {
- c.logf("[v1] direct.TryLogin(token=%v, flags=%v)", t != nil, flags)
- return c.doLoginOrRegen(ctx, loginOpt{Token: t, Flags: flags})
- }
- // WaitLoginURL sits in a long poll waiting for the user to authenticate at url.
- //
- // On success, newURL and err will both be nil.
- func (c *Direct) WaitLoginURL(ctx context.Context, url string) (newURL string, err error) {
- c.logf("[v1] direct.WaitLoginURL")
- return c.doLoginOrRegen(ctx, loginOpt{URL: url})
- }
- func (c *Direct) doLoginOrRegen(ctx context.Context, opt loginOpt) (newURL string, err error) {
- mustRegen, url, oldNodeKeySignature, err := c.doLogin(ctx, opt)
- if err != nil {
- return url, err
- }
- if mustRegen {
- opt.Regen = true
- opt.OldNodeKeySignature = oldNodeKeySignature
- _, url, _, err = c.doLogin(ctx, opt)
- }
- return url, err
- }
- // SetExpirySooner attempts to shorten the expiry to the specified time.
- func (c *Direct) SetExpirySooner(ctx context.Context, expiry time.Time) error {
- c.logf("[v1] direct.SetExpirySooner()")
- newURL, err := c.doLoginOrRegen(ctx, loginOpt{Expiry: &expiry})
- c.logf("[v1] SetExpirySooner control response: newURL=%v, err=%v", newURL, err)
- return err
- }
- type loginOpt struct {
- Token *tailcfg.Oauth2Token
- Flags LoginFlags
- Regen bool // generate a new nodekey, can be overridden in doLogin
- URL string
- Logout bool // set the expiry to the far past, expiring the node
- // Expiry, if non-nil, attempts to set the node expiry to the
- // specified time and cannot be used to extend the expiry.
- // It is ignored if Logout is set since Logout works by setting a
- // expiry time in the far past.
- Expiry *time.Time
- // OldNodeKeySignature indicates the former NodeKeySignature
- // that must be resigned for the new node-key.
- OldNodeKeySignature tkatype.MarshaledSignature
- }
// httpClient is the common interface shared by the noiseClient and the
// NaCl box http.Client.
type httpClient interface {
	// Do sends req and returns the response or an error.
	Do(req *http.Request) (*http.Response, error)
}
- // hostInfoLocked returns a Clone of c.hostinfo and c.netinfo.
- // It must only be called with c.mu held.
- func (c *Direct) hostInfoLocked() *tailcfg.Hostinfo {
- hi := c.hostinfo.Clone()
- hi.NetInfo = c.netinfo.Clone()
- return hi
- }
- func (c *Direct) doLogin(ctx context.Context, opt loginOpt) (mustRegen bool, newURL string, nks tkatype.MarshaledSignature, err error) {
- c.mu.Lock()
- persist := c.persist.AsStruct()
- tryingNewKey := c.tryingNewKey
- serverKey := c.serverKey
- serverNoiseKey := c.serverNoiseKey
- authKey, isWrapped, wrappedSig, wrappedKey := decodeWrappedAuthkey(c.authKey, c.logf)
- hi := c.hostInfoLocked()
- backendLogID := hi.BackendLogID
- expired := c.expiry != nil && !c.expiry.IsZero() && c.expiry.Before(c.timeNow())
- c.mu.Unlock()
- machinePrivKey, err := c.getMachinePrivKey()
- if err != nil {
- return false, "", nil, fmt.Errorf("getMachinePrivKey: %w", err)
- }
- if machinePrivKey.IsZero() {
- return false, "", nil, errors.New("getMachinePrivKey returned zero key")
- }
- regen := opt.Regen
- if opt.Logout {
- c.logf("logging out...")
- } else {
- if expired {
- c.logf("Old key expired -> regen=true")
- systemd.Status("key expired; run 'tailscale up' to authenticate")
- regen = true
- }
- if (opt.Flags & LoginInteractive) != 0 {
- c.logf("LoginInteractive -> regen=true")
- regen = true
- }
- }
- c.logf("doLogin(regen=%v, hasUrl=%v)", regen, opt.URL != "")
- if serverKey.IsZero() {
- keys, err := loadServerPubKeys(ctx, c.httpc, c.serverURL)
- if err != nil {
- return regen, opt.URL, nil, err
- }
- c.logf("control server key from %s: ts2021=%s, legacy=%v", c.serverURL, keys.PublicKey.ShortString(), keys.LegacyPublicKey.ShortString())
- c.mu.Lock()
- c.serverKey = keys.LegacyPublicKey
- c.serverNoiseKey = keys.PublicKey
- c.mu.Unlock()
- serverKey = keys.LegacyPublicKey
- serverNoiseKey = keys.PublicKey
- // For servers supporting the Noise transport,
- // proactively shut down our TLS TCP connection.
- // We're not going to need it and it's nicer to the
- // server.
- if !serverNoiseKey.IsZero() {
- c.httpc.CloseIdleConnections()
- }
- }
- var oldNodeKey key.NodePublic
- switch {
- case opt.Logout:
- tryingNewKey = persist.PrivateNodeKey
- case opt.URL != "":
- // Nothing.
- case regen || persist.PrivateNodeKey.IsZero():
- c.logf("Generating a new nodekey.")
- persist.OldPrivateNodeKey = persist.PrivateNodeKey
- tryingNewKey = key.NewNode()
- default:
- // Try refreshing the current key first
- tryingNewKey = persist.PrivateNodeKey
- }
- if !persist.OldPrivateNodeKey.IsZero() {
- oldNodeKey = persist.OldPrivateNodeKey.Public()
- }
- if persist.NetworkLockKey.IsZero() {
- persist.NetworkLockKey = key.NewNLPrivate()
- }
- nlPub := persist.NetworkLockKey.Public()
- if tryingNewKey.IsZero() {
- if opt.Logout {
- return false, "", nil, errors.New("no nodekey to log out")
- }
- log.Fatalf("tryingNewKey is empty, give up")
- }
- var nodeKeySignature tkatype.MarshaledSignature
- if !oldNodeKey.IsZero() && opt.OldNodeKeySignature != nil {
- if nodeKeySignature, err = resignNKS(persist.NetworkLockKey, tryingNewKey.Public(), opt.OldNodeKeySignature); err != nil {
- c.logf("Failed re-signing node-key signature: %v", err)
- }
- } else if isWrapped {
- // We were given a wrapped pre-auth key, which means that in addition
- // to being a regular pre-auth key there was a suffix with information to
- // generate a tailnet-lock signature.
- nk, err := tryingNewKey.Public().MarshalBinary()
- if err != nil {
- return false, "", nil, fmt.Errorf("marshalling node-key: %w", err)
- }
- sig := &tka.NodeKeySignature{
- SigKind: tka.SigRotation,
- Pubkey: nk,
- Nested: wrappedSig,
- }
- sigHash := sig.SigHash()
- sig.Signature = ed25519.Sign(wrappedKey, sigHash[:])
- nodeKeySignature = sig.Serialize()
- }
- if backendLogID == "" {
- err = errors.New("hostinfo: BackendLogID missing")
- return regen, opt.URL, nil, err
- }
- now := time.Now().Round(time.Second)
- request := tailcfg.RegisterRequest{
- Version: 1,
- OldNodeKey: oldNodeKey,
- NodeKey: tryingNewKey.Public(),
- NLKey: nlPub,
- Hostinfo: hi,
- Followup: opt.URL,
- Timestamp: &now,
- Ephemeral: (opt.Flags & LoginEphemeral) != 0,
- NodeKeySignature: nodeKeySignature,
- }
- if opt.Logout {
- request.Expiry = time.Unix(123, 0) // far in the past
- } else if opt.Expiry != nil {
- request.Expiry = *opt.Expiry
- }
- c.logf("RegisterReq: onode=%v node=%v fup=%v nks=%v",
- request.OldNodeKey.ShortString(),
- request.NodeKey.ShortString(), opt.URL != "", len(nodeKeySignature) > 0)
- request.Auth.Oauth2Token = opt.Token
- request.Auth.Provider = persist.Provider
- request.Auth.LoginName = persist.LoginName
- request.Auth.AuthKey = authKey
- err = signRegisterRequest(&request, c.serverURL, c.serverKey, machinePrivKey.Public())
- if err != nil {
- // If signing failed, clear all related fields
- request.SignatureType = tailcfg.SignatureNone
- request.Timestamp = nil
- request.DeviceCert = nil
- request.Signature = nil
- // Don't log the common error types. Signatures are not usually enabled,
- // so these are expected.
- if !errors.Is(err, errCertificateNotConfigured) && !errors.Is(err, errNoCertStore) {
- c.logf("RegisterReq sign error: %v", err)
- }
- }
- if debugRegister() {
- j, _ := json.MarshalIndent(request, "", "\t")
- c.logf("RegisterRequest: %s", j)
- }
- // URL and httpc are protocol specific.
- var url string
- var httpc httpClient
- if serverNoiseKey.IsZero() {
- httpc = c.httpc
- url = fmt.Sprintf("%s/machine/%s", c.serverURL, machinePrivKey.Public().UntypedHexString())
- } else {
- request.Version = tailcfg.CurrentCapabilityVersion
- httpc, err = c.getNoiseClient()
- if err != nil {
- return regen, opt.URL, nil, fmt.Errorf("getNoiseClient: %w", err)
- }
- url = fmt.Sprintf("%s/machine/register", c.serverURL)
- url = strings.Replace(url, "http:", "https:", 1)
- }
- bodyData, err := encode(request, serverKey, serverNoiseKey, machinePrivKey)
- if err != nil {
- return regen, opt.URL, nil, err
- }
- req, err := http.NewRequestWithContext(ctx, "POST", url, bytes.NewReader(bodyData))
- if err != nil {
- return regen, opt.URL, nil, err
- }
- res, err := httpc.Do(req)
- if err != nil {
- return regen, opt.URL, nil, fmt.Errorf("register request: %w", err)
- }
- if res.StatusCode != 200 {
- msg, _ := io.ReadAll(res.Body)
- res.Body.Close()
- return regen, opt.URL, nil, fmt.Errorf("register request: http %d: %.200s",
- res.StatusCode, strings.TrimSpace(string(msg)))
- }
- resp := tailcfg.RegisterResponse{}
- if err := decode(res, &resp, serverKey, serverNoiseKey, machinePrivKey); err != nil {
- c.logf("error decoding RegisterResponse with server key %s and machine key %s: %v", serverKey, machinePrivKey.Public(), err)
- return regen, opt.URL, nil, fmt.Errorf("register request: %v", err)
- }
- if debugRegister() {
- j, _ := json.MarshalIndent(resp, "", "\t")
- c.logf("RegisterResponse: %s", j)
- }
- // Log without PII:
- c.logf("RegisterReq: got response; nodeKeyExpired=%v, machineAuthorized=%v; authURL=%v",
- resp.NodeKeyExpired, resp.MachineAuthorized, resp.AuthURL != "")
- if resp.Error != "" {
- return false, "", nil, UserVisibleError(resp.Error)
- }
- if len(resp.NodeKeySignature) > 0 {
- return true, "", resp.NodeKeySignature, nil
- }
- if resp.NodeKeyExpired {
- if regen {
- return true, "", nil, fmt.Errorf("weird: regen=true but server says NodeKeyExpired: %v", request.NodeKey)
- }
- c.logf("server reports new node key %v has expired",
- request.NodeKey.ShortString())
- return true, "", nil, nil
- }
- if resp.Login.Provider != "" {
- persist.Provider = resp.Login.Provider
- }
- if resp.Login.LoginName != "" {
- persist.LoginName = resp.Login.LoginName
- }
- persist.UserProfile = tailcfg.UserProfile{
- ID: resp.User.ID,
- DisplayName: resp.Login.DisplayName,
- ProfilePicURL: resp.Login.ProfilePicURL,
- LoginName: resp.Login.LoginName,
- }
- // TODO(crawshaw): RegisterResponse should be able to mechanically
- // communicate some extra instructions from the server:
- // - new node key required
- // - machine key no longer supported
- // - user is disabled
- if resp.AuthURL != "" {
- c.logf("AuthURL is %v", resp.AuthURL)
- } else {
- c.logf("[v1] No AuthURL")
- }
- c.mu.Lock()
- if resp.AuthURL == "" {
- // key rotation is complete
- persist.PrivateNodeKey = tryingNewKey
- } else {
- // save it for the retry-with-URL
- c.tryingNewKey = tryingNewKey
- }
- c.persist = persist.View()
- c.mu.Unlock()
- if err != nil {
- return regen, "", nil, err
- }
- if ctx.Err() != nil {
- return regen, "", nil, ctx.Err()
- }
- return false, resp.AuthURL, nil, nil
- }
- // resignNKS re-signs a node-key signature for a new node-key.
- //
- // This only matters on network-locked tailnets, because node-key signatures are
- // how other nodes know that a node-key is authentic. When the node-key is
- // rotated then the existing signature becomes invalid, so this function is
- // responsible for generating a new wrapping signature to certify the new node-key.
- //
- // The signature itself is a SigRotation signature, which embeds the old signature
- // and certifies the new node-key as a replacement for the old by signing the new
- // signature with RotationPubkey (which is the node's own network-lock key).
- func resignNKS(priv key.NLPrivate, nodeKey key.NodePublic, oldNKS tkatype.MarshaledSignature) (tkatype.MarshaledSignature, error) {
- var oldSig tka.NodeKeySignature
- if err := oldSig.Unserialize(oldNKS); err != nil {
- return nil, fmt.Errorf("decoding NKS: %w", err)
- }
- nk, err := nodeKey.MarshalBinary()
- if err != nil {
- return nil, fmt.Errorf("marshalling node-key: %w", err)
- }
- if bytes.Equal(nk, oldSig.Pubkey) {
- // The old signature is valid for the node-key we are using, so just
- // use it verbatim.
- return oldNKS, nil
- }
- newSig := tka.NodeKeySignature{
- SigKind: tka.SigRotation,
- Pubkey: nk,
- Nested: &oldSig,
- }
- if newSig.Signature, err = priv.SignNKS(newSig.SigHash()); err != nil {
- return nil, fmt.Errorf("signing NKS: %w", err)
- }
- return newSig.Serialize(), nil
- }
- func sameEndpoints(a, b []tailcfg.Endpoint) bool {
- if len(a) != len(b) {
- return false
- }
- for i := range a {
- if a[i] != b[i] {
- return false
- }
- }
- return true
- }
- // newEndpoints acquires c.mu and sets the local port and endpoints and reports
- // whether they've changed.
- //
- // It does not retain the provided slice.
- func (c *Direct) newEndpoints(endpoints []tailcfg.Endpoint) (changed bool) {
- c.mu.Lock()
- defer c.mu.Unlock()
- // Nothing new?
- if sameEndpoints(c.endpoints, endpoints) {
- return false // unchanged
- }
- var epStrs []string
- for _, ep := range endpoints {
- epStrs = append(epStrs, ep.Addr.String())
- }
- c.logf("[v2] client.newEndpoints(%v)", epStrs)
- c.endpoints = append(c.endpoints[:0], endpoints...)
- return true // changed
- }
- // SetEndpoints updates the list of locally advertised endpoints.
- // It won't be replicated to the server until a *fresh* call to PollNetMap().
- // You don't need to restart PollNetMap if we return changed==false.
- func (c *Direct) SetEndpoints(endpoints []tailcfg.Endpoint) (changed bool) {
- // (no log message on function entry, because it clutters the logs
- // if endpoints haven't changed. newEndpoints() will log it.)
- return c.newEndpoints(endpoints)
- }
- // PollNetMap makes a /map request to download the network map, calling cb with
- // each new netmap.
- func (c *Direct) PollNetMap(ctx context.Context, cb func(*netmap.NetworkMap)) error {
- return c.sendMapRequest(ctx, -1, false, cb)
- }
- // FetchNetMap fetches the netmap once.
- func (c *Direct) FetchNetMap(ctx context.Context) (*netmap.NetworkMap, error) {
- var ret *netmap.NetworkMap
- err := c.sendMapRequest(ctx, 1, false, func(nm *netmap.NetworkMap) {
- ret = nm
- })
- if err == nil && ret == nil {
- return nil, errors.New("[unexpected] sendMapRequest success without callback")
- }
- return ret, err
- }
- // SendLiteMapUpdate makes a /map request to update the server of our latest state,
- // but does not fetch anything. It returns an error if the server did not return a
- // successful 200 OK response.
- func (c *Direct) SendLiteMapUpdate(ctx context.Context) error {
- return c.sendMapRequest(ctx, 1, false, nil)
- }
// pollTimeout is how long we go without hearing from the server before
// ending the long poll. We should be receiving a keep alive ping
// every minute.
const pollTimeout = 2 * time.Minute
- // cb nil means to omit peers.
- func (c *Direct) sendMapRequest(ctx context.Context, maxPolls int, readOnly bool, cb func(*netmap.NetworkMap)) error {
- metricMapRequests.Add(1)
- metricMapRequestsActive.Add(1)
- defer metricMapRequestsActive.Add(-1)
- if maxPolls == -1 {
- metricMapRequestsPoll.Add(1)
- } else {
- metricMapRequestsLite.Add(1)
- }
- c.mu.Lock()
- persist := c.persist
- serverURL := c.serverURL
- serverKey := c.serverKey
- serverNoiseKey := c.serverNoiseKey
- hi := c.hostInfoLocked()
- backendLogID := hi.BackendLogID
- var epStrs []string
- var epTypes []tailcfg.EndpointType
- for _, ep := range c.endpoints {
- epStrs = append(epStrs, ep.Addr.String())
- epTypes = append(epTypes, ep.Type)
- }
- c.mu.Unlock()
- machinePrivKey, err := c.getMachinePrivKey()
- if err != nil {
- return fmt.Errorf("getMachinePrivKey: %w", err)
- }
- if machinePrivKey.IsZero() {
- return errors.New("getMachinePrivKey returned zero key")
- }
- if persist.PrivateNodeKey().IsZero() {
- return errors.New("privateNodeKey is zero")
- }
- if backendLogID == "" {
- return errors.New("hostinfo: BackendLogID missing")
- }
- allowStream := maxPolls != 1
- c.logf("[v1] PollNetMap: stream=%v ep=%v", allowStream, epStrs)
- vlogf := logger.Discard
- if DevKnob.DumpNetMaps() {
- // TODO(bradfitz): update this to use "[v2]" prefix perhaps? but we don't
- // want to upload it always.
- vlogf = c.logf
- }
- request := &tailcfg.MapRequest{
- Version: tailcfg.CurrentCapabilityVersion,
- KeepAlive: c.keepAlive,
- NodeKey: persist.PublicNodeKey(),
- DiscoKey: c.discoPubKey,
- Endpoints: epStrs,
- EndpointTypes: epTypes,
- Stream: allowStream,
- Hostinfo: hi,
- DebugFlags: c.debugFlags,
- OmitPeers: cb == nil,
- TKAHead: c.tkaHead,
- // Previously we'd set ReadOnly to true if we didn't have any endpoints
- // yet as we expected to learn them in a half second and restart the full
- // streaming map poll, however as we are trying to reduce the number of
- // times we restart the full streaming map poll we now just set ReadOnly
- // false when we're doing a full streaming map poll.
- //
- // TODO(maisem/bradfitz): really ReadOnly should be set to true if for
- // all streams and we should only do writes via lite map updates.
- // However that requires an audit and a bunch of testing to make sure we
- // don't break anything.
- ReadOnly: readOnly && !allowStream,
- }
- var extraDebugFlags []string
- if hi != nil && c.netMon != nil && !c.skipIPForwardingCheck &&
- ipForwardingBroken(hi.RoutableIPs, c.netMon.InterfaceState()) {
- extraDebugFlags = append(extraDebugFlags, "warn-ip-forwarding-off")
- }
- if health.RouterHealth() != nil {
- extraDebugFlags = append(extraDebugFlags, "warn-router-unhealthy")
- }
- extraDebugFlags = health.AppendWarnableDebugFlags(extraDebugFlags)
- if hostinfo.DisabledEtcAptSource() {
- extraDebugFlags = append(extraDebugFlags, "warn-etc-apt-source-disabled")
- }
- if len(extraDebugFlags) > 0 {
- old := request.DebugFlags
- request.DebugFlags = append(old[:len(old):len(old)], extraDebugFlags...)
- }
- if c.newDecompressor != nil {
- request.Compress = "zstd"
- }
- bodyData, err := encode(request, serverKey, serverNoiseKey, machinePrivKey)
- if err != nil {
- vlogf("netmap: encode: %v", err)
- return err
- }
- ctx, cancel := context.WithCancel(ctx)
- defer cancel()
- machinePubKey := machinePrivKey.Public()
- t0 := time.Now()
- // Url and httpc are protocol specific.
- var url string
- var httpc httpClient
- if serverNoiseKey.IsZero() {
- httpc = c.httpc
- url = fmt.Sprintf("%s/machine/%s/map", serverURL, machinePubKey.UntypedHexString())
- } else {
- httpc, err = c.getNoiseClient()
- if err != nil {
- return fmt.Errorf("getNoiseClient: %w", err)
- }
- url = fmt.Sprintf("%s/machine/map", serverURL)
- url = strings.Replace(url, "http:", "https:", 1)
- }
- req, err := http.NewRequestWithContext(ctx, "POST", url, bytes.NewReader(bodyData))
- if err != nil {
- return err
- }
- res, err := httpc.Do(req)
- if err != nil {
- vlogf("netmap: Do: %v", err)
- return err
- }
- vlogf("netmap: Do = %v after %v", res.StatusCode, time.Since(t0).Round(time.Millisecond))
- if res.StatusCode != 200 {
- msg, _ := io.ReadAll(res.Body)
- res.Body.Close()
- return fmt.Errorf("initial fetch failed %d: %.200s",
- res.StatusCode, strings.TrimSpace(string(msg)))
- }
- defer res.Body.Close()
- health.NoteMapRequestHeard(request)
- if cb == nil {
- io.Copy(io.Discard, res.Body)
- return nil
- }
- timeout := time.NewTimer(pollTimeout)
- timeoutReset := make(chan struct{})
- pollDone := make(chan struct{})
- defer close(pollDone)
- go func() {
- for {
- select {
- case <-pollDone:
- vlogf("netmap: ending timeout goroutine")
- return
- case <-timeout.C:
- c.logf("map response long-poll timed out!")
- cancel()
- return
- case <-timeoutReset:
- if !timeout.Stop() {
- select {
- case <-timeout.C:
- case <-pollDone:
- vlogf("netmap: ending timeout goroutine")
- return
- }
- }
- vlogf("netmap: reset timeout timer")
- timeout.Reset(pollTimeout)
- }
- }
- }()
- sess := newMapSession(persist.PrivateNodeKey())
- sess.logf = c.logf
- sess.vlogf = vlogf
- sess.machinePubKey = machinePubKey
- sess.keepSharerAndUserSplit = c.keepSharerAndUserSplit
- // If allowStream, then the server will use an HTTP long poll to
- // return incremental results. There is always one response right
- // away, followed by a delay, and eventually others.
- // If !allowStream, it'll still send the first result in exactly
- // the same format before just closing the connection.
- // We can use this same read loop either way.
- var msg []byte
- for i := 0; i < maxPolls || maxPolls < 0; i++ {
- vlogf("netmap: starting size read after %v (poll %v)", time.Since(t0).Round(time.Millisecond), i)
- var siz [4]byte
- if _, err := io.ReadFull(res.Body, siz[:]); err != nil {
- vlogf("netmap: size read error after %v: %v", time.Since(t0).Round(time.Millisecond), err)
- return err
- }
- size := binary.LittleEndian.Uint32(siz[:])
- vlogf("netmap: read size %v after %v", size, time.Since(t0).Round(time.Millisecond))
- msg = append(msg[:0], make([]byte, size)...)
- if _, err := io.ReadFull(res.Body, msg); err != nil {
- vlogf("netmap: body read error: %v", err)
- return err
- }
- vlogf("netmap: read body after %v", time.Since(t0).Round(time.Millisecond))
- var resp tailcfg.MapResponse
- if err := c.decodeMsg(msg, &resp, machinePrivKey); err != nil {
- vlogf("netmap: decode error: %v")
- return err
- }
- metricMapResponseMessages.Add(1)
- if allowStream {
- health.GotStreamedMapResponse()
- }
- if pr := resp.PingRequest; pr != nil && c.isUniquePingRequest(pr) {
- metricMapResponsePings.Add(1)
- go c.answerPing(pr)
- }
- if u := resp.PopBrowserURL; u != "" && u != sess.lastPopBrowserURL {
- sess.lastPopBrowserURL = u
- if c.popBrowser != nil {
- c.logf("netmap: control says to open URL %v; opening...", u)
- c.popBrowser(u)
- } else {
- c.logf("netmap: control says to open URL %v; no popBrowser func", u)
- }
- }
- if resp.ClientVersion != nil && c.onClientVersion != nil {
- c.onClientVersion(resp.ClientVersion)
- }
- if resp.ControlTime != nil && !resp.ControlTime.IsZero() {
- c.logf.JSON(1, "controltime", resp.ControlTime.UTC())
- if c.onControlTime != nil {
- c.onControlTime(*resp.ControlTime)
- }
- }
- if resp.KeepAlive {
- vlogf("netmap: got keep-alive")
- } else {
- vlogf("netmap: got new map")
- }
- if resp.ControlDialPlan != nil {
- if c.dialPlan != nil {
- c.logf("netmap: got new dial plan from control")
- c.dialPlan.Store(resp.ControlDialPlan)
- } else {
- c.logf("netmap: [unexpected] new dial plan; nowhere to store it")
- }
- }
- select {
- case timeoutReset <- struct{}{}:
- vlogf("netmap: sent timer reset")
- case <-ctx.Done():
- c.logf("[v1] netmap: not resetting timer; context done: %v", ctx.Err())
- return ctx.Err()
- }
- if resp.KeepAlive {
- metricMapResponseKeepAlives.Add(1)
- continue
- }
- metricMapResponseMap.Add(1)
- if i > 0 {
- metricMapResponseMapDelta.Add(1)
- }
- hasDebug := resp.Debug != nil
- // being conservative here, if Debug not present set to False
- controlknobs.SetDisableUPnP(hasDebug && resp.Debug.DisableUPnP.EqualBool(true))
- if hasDebug {
- if code := resp.Debug.Exit; code != nil {
- c.logf("exiting process with status %v per controlplane", *code)
- os.Exit(*code)
- }
- if resp.Debug.DisableLogTail {
- logtail.Disable()
- envknob.SetNoLogsNoSupport()
- }
- if resp.Debug.LogHeapPprof {
- go logheap.LogHeap(resp.Debug.LogHeapURL)
- }
- if resp.Debug.GoroutineDumpURL != "" {
- go dumpGoroutinesToURL(c.httpc, resp.Debug.GoroutineDumpURL)
- }
- if sleep := time.Duration(resp.Debug.SleepSeconds * float64(time.Second)); sleep > 0 {
- if err := sleepAsRequested(ctx, c.logf, timeoutReset, sleep); err != nil {
- return err
- }
- }
- }
- nm := sess.netmapForResponse(&resp)
- if nm.SelfNode == nil {
- c.logf("MapResponse lacked node")
- return errors.New("MapResponse lacked node")
- }
- if d := nm.Debug; d != nil {
- controlUseDERPRoute.Store(d.DERPRoute)
- controlTrimWGConfig.Store(d.TrimWGConfig)
- }
- if DevKnob.StripEndpoints() {
- for _, p := range resp.Peers {
- p.Endpoints = nil
- }
- }
- if DevKnob.StripCaps() {
- nm.SelfNode.Capabilities = nil
- }
- // Occasionally print the netmap header.
- // This is handy for debugging, and our logs processing
- // pipeline depends on it. (TODO: Remove this dependency.)
- // Code elsewhere prints netmap diffs every time they are received.
- now := c.timeNow()
- if now.Sub(c.lastPrintMap) >= 5*time.Minute {
- c.lastPrintMap = now
- c.logf("[v1] new network map[%d]:\n%s", i, nm.VeryConcise())
- }
- c.mu.Lock()
- c.expiry = &nm.Expiry
- c.mu.Unlock()
- cb(nm)
- }
- if ctx.Err() != nil {
- return ctx.Err()
- }
- return nil
- }
- // decode JSON decodes the res.Body into v. If serverNoiseKey is not specified,
- // it uses the serverKey and mkey to decode the message from the NaCl-crypto-box.
- func decode(res *http.Response, v any, serverKey, serverNoiseKey key.MachinePublic, mkey key.MachinePrivate) error {
- defer res.Body.Close()
- msg, err := io.ReadAll(io.LimitReader(res.Body, 1<<20))
- if err != nil {
- return err
- }
- if res.StatusCode != 200 {
- return fmt.Errorf("%d: %v", res.StatusCode, string(msg))
- }
- if !serverNoiseKey.IsZero() {
- return json.Unmarshal(msg, v)
- }
- return decodeMsg(msg, v, serverKey, mkey)
- }
- var (
- debugMap = envknob.RegisterBool("TS_DEBUG_MAP")
- debugRegister = envknob.RegisterBool("TS_DEBUG_REGISTER")
- )
// jsonEscapedZero is the six-byte JSON escape sequence for a NUL character
// (a backslash followed by "u0000").
var jsonEscapedZero = []byte("\\u0000")
- // decodeMsg is responsible for uncompressing msg and unmarshaling into v.
- // If c.serverNoiseKey is not specified, it uses the c.serverKey and mkey
- // to first the decrypt msg from the NaCl-crypto-box.
- func (c *Direct) decodeMsg(msg []byte, v any, mkey key.MachinePrivate) error {
- c.mu.Lock()
- serverKey := c.serverKey
- serverNoiseKey := c.serverNoiseKey
- c.mu.Unlock()
- var decrypted []byte
- if serverNoiseKey.IsZero() {
- var ok bool
- decrypted, ok = mkey.OpenFrom(serverKey, msg)
- if !ok {
- return errors.New("cannot decrypt response")
- }
- } else {
- decrypted = msg
- }
- var b []byte
- if c.newDecompressor == nil {
- b = decrypted
- } else {
- decoder, err := c.newDecompressor()
- if err != nil {
- return err
- }
- defer decoder.Close()
- b, err = decoder.DecodeAll(decrypted, nil)
- if err != nil {
- return err
- }
- }
- if debugMap() {
- var buf bytes.Buffer
- json.Indent(&buf, b, "", " ")
- log.Printf("MapResponse: %s", buf.Bytes())
- }
- if bytes.Contains(b, jsonEscapedZero) {
- log.Printf("[unexpected] zero byte in controlclient.Direct.decodeMsg into %T: %q", v, b)
- }
- if err := json.Unmarshal(b, v); err != nil {
- return fmt.Errorf("response: %v", err)
- }
- return nil
- }
- func decodeMsg(msg []byte, v any, serverKey key.MachinePublic, machinePrivKey key.MachinePrivate) error {
- decrypted, ok := machinePrivKey.OpenFrom(serverKey, msg)
- if !ok {
- return errors.New("cannot decrypt response")
- }
- if bytes.Contains(decrypted, jsonEscapedZero) {
- log.Printf("[unexpected] zero byte in controlclient decodeMsg into %T: %q", v, decrypted)
- }
- if err := json.Unmarshal(decrypted, v); err != nil {
- return fmt.Errorf("response: %v", err)
- }
- return nil
- }
- // encode JSON encodes v. If serverNoiseKey is not specified, it uses the serverKey and mkey to
- // seal the message into a NaCl-crypto-box.
- func encode(v any, serverKey, serverNoiseKey key.MachinePublic, mkey key.MachinePrivate) ([]byte, error) {
- b, err := json.Marshal(v)
- if err != nil {
- return nil, err
- }
- if debugMap() {
- if _, ok := v.(*tailcfg.MapRequest); ok {
- log.Printf("MapRequest: %s", b)
- }
- }
- if !serverNoiseKey.IsZero() {
- return b, nil
- }
- return mkey.SealTo(serverKey, b), nil
- }
- func loadServerPubKeys(ctx context.Context, httpc *http.Client, serverURL string) (*tailcfg.OverTLSPublicKeyResponse, error) {
- keyURL := fmt.Sprintf("%v/key?v=%d", serverURL, tailcfg.CurrentCapabilityVersion)
- req, err := http.NewRequestWithContext(ctx, "GET", keyURL, nil)
- if err != nil {
- return nil, fmt.Errorf("create control key request: %v", err)
- }
- res, err := httpc.Do(req)
- if err != nil {
- return nil, fmt.Errorf("fetch control key: %v", err)
- }
- defer res.Body.Close()
- b, err := io.ReadAll(io.LimitReader(res.Body, 64<<10))
- if err != nil {
- return nil, fmt.Errorf("fetch control key response: %v", err)
- }
- if res.StatusCode != 200 {
- return nil, fmt.Errorf("fetch control key: %d", res.StatusCode)
- }
- var out tailcfg.OverTLSPublicKeyResponse
- jsonErr := json.Unmarshal(b, &out)
- if jsonErr == nil {
- return &out, nil
- }
- // Some old control servers might not be updated to send the new format.
- // Accept the old pre-JSON format too.
- out = tailcfg.OverTLSPublicKeyResponse{}
- k, err := key.ParseMachinePublicUntyped(mem.B(b))
- if err != nil {
- return nil, multierr.New(jsonErr, err)
- }
- out.LegacyPublicKey = k
- return &out, nil
- }
- // DevKnob contains temporary internal-only debug knobs.
- // They're unexported to not draw attention to them.
- var DevKnob = initDevKnob()
// devKnobs is the set of debug knobs exposed through DevKnob. Each field is a
// func that reports whether the corresponding knob is enabled.
type devKnobs struct {
	// DumpNetMaps, when true, makes sendMapRequest send its verbose netmap
	// logging to the regular logger instead of discarding it.
	DumpNetMaps func() bool

	// ForceProxyDNS is registered from TS_DEBUG_PROXY_DNS.
	ForceProxyDNS func() bool

	// StripEndpoints strips endpoints from control (only use disco messages).
	StripEndpoints func() bool

	// StripCaps strips all local node's control-provided capabilities.
	StripCaps func() bool
}
- func initDevKnob() devKnobs {
- return devKnobs{
- DumpNetMaps: envknob.RegisterBool("TS_DEBUG_NETMAP"),
- ForceProxyDNS: envknob.RegisterBool("TS_DEBUG_PROXY_DNS"),
- StripEndpoints: envknob.RegisterBool("TS_DEBUG_STRIP_ENDPOINTS"),
- StripCaps: envknob.RegisterBool("TS_DEBUG_STRIP_CAPS"),
- }
- }
// clockNow returns the current time. It is a package-level variable
// initialized to time.Now.
var clockNow func() time.Time = time.Now
- // opt.Bool configs from control.
- var (
- controlUseDERPRoute syncs.AtomicValue[opt.Bool]
- controlTrimWGConfig syncs.AtomicValue[opt.Bool]
- )
- // DERPRouteFlag reports the last reported value from control for whether
- // DERP route optimization (Issue 150) should be enabled.
- func DERPRouteFlag() opt.Bool {
- return controlUseDERPRoute.Load()
- }
- // TrimWGConfig reports the last reported value from control for whether
- // we should do lazy wireguard configuration.
- func TrimWGConfig() opt.Bool {
- return controlTrimWGConfig.Load()
- }
- // ipForwardingBroken reports whether the system's IP forwarding is disabled
- // and will definitely not work for the routes provided.
- //
- // It should not return false positives.
- //
- // TODO(bradfitz): Change controlclient.Options.SkipIPForwardingCheck into a
- // func([]netip.Prefix) error signature instead.
- func ipForwardingBroken(routes []netip.Prefix, state *interfaces.State) bool {
- warn, err := netutil.CheckIPForwarding(routes, state)
- if err != nil {
- // Oh well, we tried. This is just for debugging.
- // We don't want false positives.
- // TODO: maybe we want a different warning for inability to check?
- return false
- }
- return warn != nil
- }
- // isUniquePingRequest reports whether pr contains a new PingRequest.URL
- // not already handled, noting its value when returning true.
- func (c *Direct) isUniquePingRequest(pr *tailcfg.PingRequest) bool {
- if pr == nil || pr.URL == "" {
- // Bogus.
- return false
- }
- c.mu.Lock()
- defer c.mu.Unlock()
- if pr.URL == c.lastPingURL {
- return false
- }
- c.lastPingURL = pr.URL
- return true
- }
- func (c *Direct) answerPing(pr *tailcfg.PingRequest) {
- httpc := c.httpc
- useNoise := pr.URLIsNoise || pr.Types == "c2n" && c.noiseConfigured()
- if useNoise {
- nc, err := c.getNoiseClient()
- if err != nil {
- c.logf("failed to get noise client for ping request: %v", err)
- return
- }
- httpc = nc.Client
- }
- if pr.URL == "" {
- c.logf("invalid PingRequest with no URL")
- return
- }
- switch pr.Types {
- case "":
- answerHeadPing(c.logf, httpc, pr)
- return
- case "c2n":
- if !useNoise && !envknob.Bool("TS_DEBUG_PERMIT_HTTP_C2N") {
- c.logf("refusing to answer c2n ping without noise")
- return
- }
- answerC2NPing(c.logf, c.c2nHandler, httpc, pr)
- return
- }
- for _, t := range strings.Split(pr.Types, ",") {
- switch pt := tailcfg.PingType(t); pt {
- case tailcfg.PingTSMP, tailcfg.PingDisco, tailcfg.PingICMP, tailcfg.PingPeerAPI:
- go doPingerPing(c.logf, httpc, pr, c.pinger, pt)
- default:
- c.logf("unsupported ping request type: %q", t)
- }
- }
- }
- func answerHeadPing(logf logger.Logf, c *http.Client, pr *tailcfg.PingRequest) {
- ctx, cancel := context.WithTimeout(context.Background(), 15*time.Second)
- defer cancel()
- req, err := http.NewRequestWithContext(ctx, "HEAD", pr.URL, nil)
- if err != nil {
- logf("answerHeadPing: NewRequestWithContext: %v", err)
- return
- }
- if pr.Log {
- logf("answerHeadPing: sending HEAD ping to %v ...", pr.URL)
- }
- t0 := time.Now()
- _, err = c.Do(req)
- d := time.Since(t0).Round(time.Millisecond)
- if err != nil {
- logf("answerHeadPing error: %v to %v (after %v)", err, pr.URL, d)
- } else if pr.Log {
- logf("answerHeadPing complete to %v (after %v)", pr.URL, d)
- }
- }
- func answerC2NPing(logf logger.Logf, c2nHandler http.Handler, c *http.Client, pr *tailcfg.PingRequest) {
- if c2nHandler == nil {
- logf("answerC2NPing: c2nHandler not defined")
- return
- }
- hreq, err := http.ReadRequest(bufio.NewReader(bytes.NewReader(pr.Payload)))
- if err != nil {
- logf("answerC2NPing: ReadRequest: %v", err)
- return
- }
- if pr.Log {
- logf("answerC2NPing: got c2n request for %v ...", hreq.RequestURI)
- }
- handlerTimeout := time.Minute
- if v := hreq.Header.Get("C2n-Handler-Timeout"); v != "" {
- handlerTimeout, _ = time.ParseDuration(v)
- }
- handlerCtx, cancel := context.WithTimeout(context.Background(), handlerTimeout)
- defer cancel()
- hreq = hreq.WithContext(handlerCtx)
- rec := httptest.NewRecorder()
- c2nHandler.ServeHTTP(rec, hreq)
- cancel()
- c2nResBuf := new(bytes.Buffer)
- rec.Result().Write(c2nResBuf)
- replyCtx, cancel := context.WithTimeout(context.Background(), time.Minute)
- defer cancel()
- req, err := http.NewRequestWithContext(replyCtx, "POST", pr.URL, c2nResBuf)
- if err != nil {
- logf("answerC2NPing: NewRequestWithContext: %v", err)
- return
- }
- if pr.Log {
- logf("answerC2NPing: sending POST ping to %v ...", pr.URL)
- }
- t0 := time.Now()
- _, err = c.Do(req)
- d := time.Since(t0).Round(time.Millisecond)
- if err != nil {
- logf("answerC2NPing error: %v to %v (after %v)", err, pr.URL, d)
- } else if pr.Log {
- logf("answerC2NPing complete to %v (after %v)", pr.URL, d)
- }
- }
- func sleepAsRequested(ctx context.Context, logf logger.Logf, timeoutReset chan<- struct{}, d time.Duration) error {
- const maxSleep = 5 * time.Minute
- if d > maxSleep {
- logf("sleeping for %v, capped from server-requested %v ...", maxSleep, d)
- d = maxSleep
- } else {
- logf("sleeping for server-requested %v ...", d)
- }
- ticker := time.NewTicker(pollTimeout / 2)
- defer ticker.Stop()
- timer := time.NewTimer(d)
- defer timer.Stop()
- for {
- select {
- case <-ctx.Done():
- return ctx.Err()
- case <-timer.C:
- return nil
- case <-ticker.C:
- select {
- case timeoutReset <- struct{}{}:
- case <-timer.C:
- return nil
- case <-ctx.Done():
- return ctx.Err()
- }
- }
- }
- }
- // getNoiseClient returns the noise client, creating one if one doesn't exist.
- func (c *Direct) getNoiseClient() (*NoiseClient, error) {
- c.mu.Lock()
- serverNoiseKey := c.serverNoiseKey
- nc := c.noiseClient
- c.mu.Unlock()
- if serverNoiseKey.IsZero() {
- return nil, errors.New("zero serverNoiseKey")
- }
- if nc != nil {
- return nc, nil
- }
- var dp func() *tailcfg.ControlDialPlan
- if c.dialPlan != nil {
- dp = c.dialPlan.Load
- }
- nc, err, _ := c.sfGroup.Do(struct{}{}, func() (*NoiseClient, error) {
- k, err := c.getMachinePrivKey()
- if err != nil {
- return nil, err
- }
- c.logf("creating new noise client")
- nc, err := NewNoiseClient(NoiseOpts{
- PrivKey: k,
- ServerPubKey: serverNoiseKey,
- ServerURL: c.serverURL,
- Dialer: c.dialer,
- DNSCache: c.dnsCache,
- Logf: c.logf,
- NetMon: c.netMon,
- DialPlan: dp,
- })
- if err != nil {
- return nil, err
- }
- c.mu.Lock()
- defer c.mu.Unlock()
- c.noiseClient = nc
- return nc, nil
- })
- if err != nil {
- return nil, err
- }
- return nc, nil
- }
- // setDNSNoise sends the SetDNSRequest request to the control plane server over Noise,
- // requesting a DNS record be created or updated.
- func (c *Direct) setDNSNoise(ctx context.Context, req *tailcfg.SetDNSRequest) error {
- newReq := *req
- newReq.Version = tailcfg.CurrentCapabilityVersion
- nc, err := c.getNoiseClient()
- if err != nil {
- return err
- }
- res, err := nc.post(ctx, "/machine/set-dns", &newReq)
- if err != nil {
- return err
- }
- defer res.Body.Close()
- if res.StatusCode != 200 {
- msg, _ := io.ReadAll(res.Body)
- return fmt.Errorf("set-dns response: %v, %.200s", res.Status, strings.TrimSpace(string(msg)))
- }
- var setDNSRes tailcfg.SetDNSResponse
- if err := json.NewDecoder(res.Body).Decode(&setDNSRes); err != nil {
- c.logf("error decoding SetDNSResponse: %v", err)
- return fmt.Errorf("set-dns-response: %w", err)
- }
- return nil
- }
- // noiseConfigured reports whether the client can communicate with Control
- // over Noise.
- func (c *Direct) noiseConfigured() bool {
- c.mu.Lock()
- defer c.mu.Unlock()
- return !c.serverNoiseKey.IsZero()
- }
- // SetDNS sends the SetDNSRequest request to the control plane server,
- // requesting a DNS record be created or updated.
- func (c *Direct) SetDNS(ctx context.Context, req *tailcfg.SetDNSRequest) (err error) {
- metricSetDNS.Add(1)
- defer func() {
- if err != nil {
- metricSetDNSError.Add(1)
- }
- }()
- if c.noiseConfigured() {
- return c.setDNSNoise(ctx, req)
- }
- c.mu.Lock()
- serverKey := c.serverKey
- c.mu.Unlock()
- if serverKey.IsZero() {
- return errors.New("zero serverKey")
- }
- machinePrivKey, err := c.getMachinePrivKey()
- if err != nil {
- return fmt.Errorf("getMachinePrivKey: %w", err)
- }
- if machinePrivKey.IsZero() {
- return errors.New("getMachinePrivKey returned zero key")
- }
- // TODO(maisem): dedupe this codepath from SetDNSNoise.
- var serverNoiseKey key.MachinePublic
- bodyData, err := encode(req, serverKey, serverNoiseKey, machinePrivKey)
- if err != nil {
- return err
- }
- body := bytes.NewReader(bodyData)
- u := fmt.Sprintf("%s/machine/%s/set-dns", c.serverURL, machinePrivKey.Public().UntypedHexString())
- hreq, err := http.NewRequestWithContext(ctx, "POST", u, body)
- if err != nil {
- return err
- }
- res, err := c.httpc.Do(hreq)
- if err != nil {
- return err
- }
- defer res.Body.Close()
- if res.StatusCode != 200 {
- msg, _ := io.ReadAll(res.Body)
- return fmt.Errorf("set-dns response: %v, %.200s", res.Status, strings.TrimSpace(string(msg)))
- }
- var setDNSRes tailcfg.SetDNSResponse
- if err := decode(res, &setDNSRes, serverKey, serverNoiseKey, machinePrivKey); err != nil {
- c.logf("error decoding SetDNSResponse with server key %s and machine key %s: %v", serverKey, machinePrivKey.Public(), err)
- return fmt.Errorf("set-dns-response: %w", err)
- }
- return nil
- }
- func (c *Direct) DoNoiseRequest(req *http.Request) (*http.Response, error) {
- nc, err := c.getNoiseClient()
- if err != nil {
- return nil, err
- }
- return nc.Do(req)
- }
- // GetSingleUseNoiseRoundTripper returns a RoundTripper that can be only be used
- // once (and must be used once) to make a single HTTP request over the noise
- // channel to the coordination server.
- //
- // In addition to the RoundTripper, it returns the HTTP/2 channel's early noise
- // payload, if any.
- func (c *Direct) GetSingleUseNoiseRoundTripper(ctx context.Context) (http.RoundTripper, *tailcfg.EarlyNoise, error) {
- nc, err := c.getNoiseClient()
- if err != nil {
- return nil, nil, err
- }
- return nc.GetSingleUseRoundTripper(ctx)
- }
- // doPingerPing sends a Ping to pr.IP using pinger, and sends an http request back to
- // pr.URL with ping response data.
- func doPingerPing(logf logger.Logf, c *http.Client, pr *tailcfg.PingRequest, pinger Pinger, pingType tailcfg.PingType) {
- if pr.URL == "" || !pr.IP.IsValid() || pinger == nil {
- logf("invalid ping request: missing url, ip or pinger")
- return
- }
- start := time.Now()
- ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
- defer cancel()
- res, err := pinger.Ping(ctx, pr.IP, pingType)
- if err != nil {
- d := time.Since(start).Round(time.Millisecond)
- logf("doPingerPing: ping error of type %q to %v after %v: %v", pingType, pr.IP, d, err)
- return
- }
- postPingResult(start, logf, c, pr, res.ToPingResponse(pingType))
- }
- func postPingResult(start time.Time, logf logger.Logf, c *http.Client, pr *tailcfg.PingRequest, res *tailcfg.PingResponse) error {
- duration := time.Since(start)
- if pr.Log {
- if res.Err == "" {
- logf("ping to %v completed in %v. pinger.Ping took %v seconds", pr.IP, res.LatencySeconds, duration)
- } else {
- logf("ping to %v failed after %v: %v", pr.IP, duration, res.Err)
- }
- }
- ctx, cancel := context.WithTimeout(context.Background(), 15*time.Second)
- defer cancel()
- jsonPingRes, err := json.Marshal(res)
- if err != nil {
- return err
- }
- // Send the results of the Ping, back to control URL.
- req, err := http.NewRequestWithContext(ctx, "POST", pr.URL, bytes.NewReader(jsonPingRes))
- if err != nil {
- return fmt.Errorf("http.NewRequestWithContext(%q): %w", pr.URL, err)
- }
- if pr.Log {
- logf("postPingResult: sending ping results to %v ...", pr.URL)
- }
- t0 := time.Now()
- _, err = c.Do(req)
- d := time.Since(t0).Round(time.Millisecond)
- if err != nil {
- return fmt.Errorf("postPingResult error: %w to %v (after %v)", err, pr.URL, d)
- } else if pr.Log {
- logf("postPingResult complete to %v (after %v)", pr.URL, d)
- }
- return nil
- }
- // ReportHealthChange reports to the control plane a change to this node's
- // health.
- func (c *Direct) ReportHealthChange(sys health.Subsystem, sysErr error) {
- if sys == health.SysOverall {
- // We don't report these. These include things like the network is down
- // (in which case we can't report anyway) or the user wanted things
- // stopped, as opposed to the more unexpected failure types in the other
- // subsystems.
- return
- }
- np, err := c.getNoiseClient()
- if err != nil {
- // Don't report errors to control if the server doesn't support noise.
- return
- }
- req := &tailcfg.HealthChangeRequest{
- Subsys: string(sys),
- }
- if sysErr != nil {
- req.Error = sysErr.Error()
- }
- // Best effort, no logging:
- ctx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
- defer cancel()
- res, err := np.post(ctx, "/machine/update-health", req)
- if err != nil {
- return
- }
- res.Body.Close()
- }
- // decodeWrappedAuthkey separates wrapping information from an authkey, if any.
- // In all cases the authkey is returned, sans wrapping information if any.
- //
- // If the authkey is wrapped, isWrapped returns true, along with the wrapping signature
- // and private key.
- func decodeWrappedAuthkey(key string, logf logger.Logf) (authKey string, isWrapped bool, sig *tka.NodeKeySignature, priv ed25519.PrivateKey) {
- authKey, suffix, found := strings.Cut(key, "--TL")
- if !found {
- return key, false, nil, nil
- }
- sigBytes, privBytes, found := strings.Cut(suffix, "-")
- if !found {
- logf("decoding wrapped auth-key: did not find delimiter")
- return key, false, nil, nil
- }
- rawSig, err := base64.RawStdEncoding.DecodeString(sigBytes)
- if err != nil {
- logf("decoding wrapped auth-key: signature decode: %v", err)
- return key, false, nil, nil
- }
- rawPriv, err := base64.RawStdEncoding.DecodeString(privBytes)
- if err != nil {
- logf("decoding wrapped auth-key: priv decode: %v", err)
- return key, false, nil, nil
- }
- sig = new(tka.NodeKeySignature)
- if err := sig.Unserialize([]byte(rawSig)); err != nil {
- logf("decoding wrapped auth-key: signature: %v", err)
- return key, false, nil, nil
- }
- priv = ed25519.PrivateKey(rawPriv)
- return authKey, true, sig, priv
- }
- var (
- metricMapRequestsActive = clientmetric.NewGauge("controlclient_map_requests_active")
- metricMapRequests = clientmetric.NewCounter("controlclient_map_requests")
- metricMapRequestsLite = clientmetric.NewCounter("controlclient_map_requests_lite")
- metricMapRequestsPoll = clientmetric.NewCounter("controlclient_map_requests_poll")
- metricMapResponseMessages = clientmetric.NewCounter("controlclient_map_response_message") // any message type
- metricMapResponsePings = clientmetric.NewCounter("controlclient_map_response_ping")
- metricMapResponseKeepAlives = clientmetric.NewCounter("controlclient_map_response_keepalive")
- metricMapResponseMap = clientmetric.NewCounter("controlclient_map_response_map") // any non-keepalive map response
- metricMapResponseMapDelta = clientmetric.NewCounter("controlclient_map_response_map_delta") // 2nd+ non-keepalive map response
- metricSetDNS = clientmetric.NewCounter("controlclient_setdns")
- metricSetDNSError = clientmetric.NewCounter("controlclient_setdns_error")
- )
|