123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263 |
- // Copyright (C) 2015 The Syncthing Authors.
- //
- // This Source Code Form is subject to the terms of the Mozilla Public
- // License, v. 2.0. If a copy of the MPL was not distributed with this file,
- // You can obtain one at https://mozilla.org/MPL/2.0/.
- //go:generate -command counterfeiter go run github.com/maxbrunsfeld/counterfeiter/v6
- //go:generate counterfeiter -o mocks/service.go --fake-name Service . Service
- package connections
- import (
- "context"
- "crypto/tls"
- "crypto/x509"
- "fmt"
- "math"
- "net"
- "net/url"
- "sort"
- "strings"
- stdsync "sync"
- "time"
- "github.com/syncthing/syncthing/lib/config"
- "github.com/syncthing/syncthing/lib/connections/registry"
- "github.com/syncthing/syncthing/lib/discover"
- "github.com/syncthing/syncthing/lib/events"
- "github.com/syncthing/syncthing/lib/nat"
- "github.com/syncthing/syncthing/lib/osutil"
- "github.com/syncthing/syncthing/lib/protocol"
- "github.com/syncthing/syncthing/lib/svcutil"
- "github.com/syncthing/syncthing/lib/sync"
- "github.com/syncthing/syncthing/lib/util"
- // Registers NAT service providers
- _ "github.com/syncthing/syncthing/lib/pmp"
- _ "github.com/syncthing/syncthing/lib/upnp"
- "github.com/pkg/errors"
- "github.com/thejerf/suture/v4"
- "golang.org/x/time/rate"
- )
- var (
- dialers = make(map[string]dialerFactory)
- listeners = make(map[string]listenerFactory)
- )
- var (
- // Dialers and listeners return errUnsupported (or a wrapped variant)
- // when they are intentionally out of service due to configuration,
- // build, etc. This is not logged loudly.
- errUnsupported = errors.New("unsupported protocol")
- // These are specific explanations for errUnsupported.
- errDisabled = fmt.Errorf("%w: disabled by configuration", errUnsupported)
- errDeprecated = fmt.Errorf("%w: deprecated", errUnsupported)
- errNotInBuild = fmt.Errorf("%w: disabled at build time", errUnsupported)
- // Various reasons to reject a connection
- errNetworkNotAllowed = errors.New("network not allowed")
- errDeviceAlreadyConnected = errors.New("already connected to this device")
- errDeviceIgnored = errors.New("device is ignored")
- errConnLimitReached = errors.New("connection limit reached")
- errDevicePaused = errors.New("device is paused")
- )
- const (
- perDeviceWarningIntv = 15 * time.Minute
- tlsHandshakeTimeout = 10 * time.Second
- minConnectionReplaceAge = 10 * time.Second
- minConnectionLoopSleep = 5 * time.Second
- stdConnectionLoopSleep = time.Minute
- worstDialerPriority = math.MaxInt32
- recentlySeenCutoff = 7 * 24 * time.Hour
- shortLivedConnectionThreshold = 5 * time.Second
- dialMaxParallel = 64
- dialMaxParallelPerDevice = 8
- )
- // From go/src/crypto/tls/cipher_suites.go
- var tlsCipherSuiteNames = map[uint16]string{
- // TLS 1.2
- 0x0005: "TLS_RSA_WITH_RC4_128_SHA",
- 0x000a: "TLS_RSA_WITH_3DES_EDE_CBC_SHA",
- 0x002f: "TLS_RSA_WITH_AES_128_CBC_SHA",
- 0x0035: "TLS_RSA_WITH_AES_256_CBC_SHA",
- 0x003c: "TLS_RSA_WITH_AES_128_CBC_SHA256",
- 0x009c: "TLS_RSA_WITH_AES_128_GCM_SHA256",
- 0x009d: "TLS_RSA_WITH_AES_256_GCM_SHA384",
- 0xc007: "TLS_ECDHE_ECDSA_WITH_RC4_128_SHA",
- 0xc009: "TLS_ECDHE_ECDSA_WITH_AES_128_CBC_SHA",
- 0xc00a: "TLS_ECDHE_ECDSA_WITH_AES_256_CBC_SHA",
- 0xc011: "TLS_ECDHE_RSA_WITH_RC4_128_SHA",
- 0xc012: "TLS_ECDHE_RSA_WITH_3DES_EDE_CBC_SHA",
- 0xc013: "TLS_ECDHE_RSA_WITH_AES_128_CBC_SHA",
- 0xc014: "TLS_ECDHE_RSA_WITH_AES_256_CBC_SHA",
- 0xc023: "TLS_ECDHE_ECDSA_WITH_AES_128_CBC_SHA256",
- 0xc027: "TLS_ECDHE_RSA_WITH_AES_128_CBC_SHA256",
- 0xc02f: "TLS_ECDHE_RSA_WITH_AES_128_GCM_SHA256",
- 0xc02b: "TLS_ECDHE_ECDSA_WITH_AES_128_GCM_SHA256",
- 0xc030: "TLS_ECDHE_RSA_WITH_AES_256_GCM_SHA384",
- 0xc02c: "TLS_ECDHE_ECDSA_WITH_AES_256_GCM_SHA384",
- 0xcca8: "TLS_ECDHE_RSA_WITH_CHACHA20_POLY1305",
- 0xcca9: "TLS_ECDHE_ECDSA_WITH_CHACHA20_POLY1305",
- // TLS 1.3
- 0x1301: "TLS_AES_128_GCM_SHA256",
- 0x1302: "TLS_AES_256_GCM_SHA384",
- 0x1303: "TLS_CHACHA20_POLY1305_SHA256",
- }
- var tlsVersionNames = map[uint16]string{
- tls.VersionTLS12: "TLS1.2",
- tls.VersionTLS13: "TLS1.3",
- }
- // Service listens and dials all configured unconnected devices, via supported
- // dialers. Successful connections are handed to the model.
- type Service interface {
- suture.Service
- discover.AddressLister
- ListenerStatus() map[string]ListenerStatusEntry
- ConnectionStatus() map[string]ConnectionStatusEntry
- NATType() string
- }
- type ListenerStatusEntry struct {
- Error *string `json:"error"`
- LANAddresses []string `json:"lanAddresses"`
- WANAddresses []string `json:"wanAddresses"`
- }
- type ConnectionStatusEntry struct {
- When time.Time `json:"when"`
- Error *string `json:"error"`
- }
- type connWithHello struct {
- c internalConn
- hello protocol.Hello
- err error
- remoteID protocol.DeviceID
- remoteCert *x509.Certificate
- }
- type service struct {
- *suture.Supervisor
- connectionStatusHandler
- cfg config.Wrapper
- myID protocol.DeviceID
- model Model
- tlsCfg *tls.Config
- discoverer discover.Finder
- conns chan internalConn
- hellos chan *connWithHello
- bepProtocolName string
- tlsDefaultCommonName string
- limiter *limiter
- natService *nat.Service
- evLogger events.Logger
- registry *registry.Registry
- dialNow chan struct{}
- dialNowDevices map[protocol.DeviceID]struct{}
- dialNowDevicesMut sync.Mutex
- listenersMut sync.RWMutex
- listeners map[string]genericListener
- listenerTokens map[string]suture.ServiceToken
- }
- func NewService(cfg config.Wrapper, myID protocol.DeviceID, mdl Model, tlsCfg *tls.Config, discoverer discover.Finder, bepProtocolName string, tlsDefaultCommonName string, evLogger events.Logger, registry *registry.Registry) Service {
- spec := svcutil.SpecWithInfoLogger(l)
- service := &service{
- Supervisor: suture.New("connections.Service", spec),
- connectionStatusHandler: newConnectionStatusHandler(),
- cfg: cfg,
- myID: myID,
- model: mdl,
- tlsCfg: tlsCfg,
- discoverer: discoverer,
- conns: make(chan internalConn),
- hellos: make(chan *connWithHello),
- bepProtocolName: bepProtocolName,
- tlsDefaultCommonName: tlsDefaultCommonName,
- limiter: newLimiter(myID, cfg),
- natService: nat.NewService(myID, cfg),
- evLogger: evLogger,
- registry: registry,
- dialNowDevicesMut: sync.NewMutex(),
- dialNow: make(chan struct{}, 1),
- dialNowDevices: make(map[protocol.DeviceID]struct{}),
- listenersMut: sync.NewRWMutex(),
- listeners: make(map[string]genericListener),
- listenerTokens: make(map[string]suture.ServiceToken),
- }
- cfg.Subscribe(service)
- raw := cfg.RawCopy()
- // Actually starts the listeners and NAT service
- // Need to start this before service.connect so that any dials that
- // try punch through already have a listener to cling on.
- service.CommitConfiguration(raw, raw)
- // There are several moving parts here; one routine per listening address
- // (handled in configuration changing) to handle incoming connections,
- // one routine to periodically attempt outgoing connections, one routine to
- // the common handling regardless of whether the connection was
- // incoming or outgoing.
- service.Add(svcutil.AsService(service.connect, fmt.Sprintf("%s/connect", service)))
- service.Add(svcutil.AsService(service.handleConns, fmt.Sprintf("%s/handleConns", service)))
- service.Add(svcutil.AsService(service.handleHellos, fmt.Sprintf("%s/handleHellos", service)))
- service.Add(service.natService)
- svcutil.OnSupervisorDone(service.Supervisor, func() {
- service.cfg.Unsubscribe(service.limiter)
- service.cfg.Unsubscribe(service)
- })
- return service
- }
- func (s *service) handleConns(ctx context.Context) error {
- for {
- var c internalConn
- select {
- case <-ctx.Done():
- return ctx.Err()
- case c = <-s.conns:
- }
- cs := c.ConnectionState()
- // We should have negotiated the next level protocol "bep/1.0" as part
- // of the TLS handshake. Unfortunately this can't be a hard error,
- // because there are implementations out there that don't support
- // protocol negotiation (iOS for one...).
- if cs.NegotiatedProtocol != s.bepProtocolName {
- l.Infof("Peer at %s did not negotiate bep/1.0", c)
- }
- // We should have received exactly one certificate from the other
- // side. If we didn't, they don't have a device ID and we drop the
- // connection.
- certs := cs.PeerCertificates
- if cl := len(certs); cl != 1 {
- l.Infof("Got peer certificate list of length %d != 1 from peer at %s; protocol error", cl, c)
- c.Close()
- continue
- }
- remoteCert := certs[0]
- remoteID := protocol.NewDeviceID(remoteCert.Raw)
- // The device ID should not be that of ourselves. It can happen
- // though, especially in the presence of NAT hairpinning, multiple
- // clients between the same NAT gateway, and global discovery.
- if remoteID == s.myID {
- l.Debugf("Connected to myself (%s) at %s", remoteID, c)
- c.Close()
- continue
- }
- if err := s.connectionCheckEarly(remoteID, c); err != nil {
- l.Infof("Connection from %s at %s (%s) rejected: %v", remoteID, c.RemoteAddr(), c.Type(), err)
- c.Close()
- continue
- }
- _ = c.SetDeadline(time.Now().Add(20 * time.Second))
- go func() {
- hello, err := protocol.ExchangeHello(c, s.model.GetHello(remoteID))
- select {
- case s.hellos <- &connWithHello{c, hello, err, remoteID, remoteCert}:
- case <-ctx.Done():
- }
- }()
- }
- }
- func (s *service) connectionCheckEarly(remoteID protocol.DeviceID, c internalConn) error {
- if s.cfg.IgnoredDevice(remoteID) {
- return errDeviceIgnored
- }
- if max := s.cfg.Options().ConnectionLimitMax; max > 0 && s.model.NumConnections() >= max {
- // We're not allowed to accept any more connections.
- return errConnLimitReached
- }
- cfg, ok := s.cfg.Device(remoteID)
- if !ok {
- // We do go ahead exchanging hello messages to get information about the device.
- return nil
- }
- if cfg.Paused {
- return errDevicePaused
- }
- if len(cfg.AllowedNetworks) > 0 && !IsAllowedNetwork(c.RemoteAddr().String(), cfg.AllowedNetworks) {
- // The connection is not from an allowed network.
- return errNetworkNotAllowed
- }
- // Lower priority is better, just like nice etc.
- if ct, ok := s.model.Connection(remoteID); ok {
- if ct.Priority() > c.priority || time.Since(ct.Statistics().StartedAt) > minConnectionReplaceAge {
- l.Debugf("Switching connections %s (existing: %s new: %s)", remoteID, ct, c)
- } else {
- // We should not already be connected to the other party. TODO: This
- // could use some better handling. If the old connection is dead but
- // hasn't timed out yet we may want to drop *that* connection and keep
- // this one. But in case we are two devices connecting to each other
- // in parallel we don't want to do that or we end up with no
- // connections still established...
- return errDeviceAlreadyConnected
- }
- }
- return nil
- }
- func (s *service) handleHellos(ctx context.Context) error {
- var c internalConn
- var hello protocol.Hello
- var err error
- var remoteID protocol.DeviceID
- var remoteCert *x509.Certificate
- for {
- select {
- case <-ctx.Done():
- return ctx.Err()
- case withHello := <-s.hellos:
- c = withHello.c
- hello = withHello.hello
- err = withHello.err
- remoteID = withHello.remoteID
- remoteCert = withHello.remoteCert
- }
- if err != nil {
- if protocol.IsVersionMismatch(err) {
- // The error will be a relatively user friendly description
- // of what's wrong with the version compatibility. By
- // default identify the other side by device ID and IP.
- remote := fmt.Sprintf("%v (%v)", remoteID, c.RemoteAddr())
- if hello.DeviceName != "" {
- // If the name was set in the hello return, use that to
- // give the user more info about which device is the
- // affected one. It probably says more than the remote
- // IP.
- remote = fmt.Sprintf("%q (%s %s, %v)", hello.DeviceName, hello.ClientName, hello.ClientVersion, remoteID)
- }
- msg := fmt.Sprintf("Connecting to %s: %s", remote, err)
- warningFor(remoteID, msg)
- } else {
- // It's something else - connection reset or whatever
- l.Infof("Failed to exchange Hello messages with %s at %s: %s", remoteID, c, err)
- }
- c.Close()
- continue
- }
- _ = c.SetDeadline(time.Time{})
- // The Model will return an error for devices that we don't want to
- // have a connection with for whatever reason, for example unknown devices.
- if err := s.model.OnHello(remoteID, c.RemoteAddr(), hello); err != nil {
- l.Infof("Connection from %s at %s (%s) rejected: %v", remoteID, c.RemoteAddr(), c.Type(), err)
- c.Close()
- continue
- }
- deviceCfg, ok := s.cfg.Device(remoteID)
- if !ok {
- l.Infof("Device %s removed from config during connection attempt at %s", remoteID, c)
- c.Close()
- continue
- }
- // Verify the name on the certificate. By default we set it to
- // "syncthing" when generating, but the user may have replaced
- // the certificate and used another name.
- certName := deviceCfg.CertName
- if certName == "" {
- certName = s.tlsDefaultCommonName
- }
- if remoteCert.Subject.CommonName == certName {
- // All good. We do this check because our old style certificates
- // have "syncthing" in the CommonName field and no SANs, which
- // is not accepted by VerifyHostname() any more as of Go 1.15.
- } else if err := remoteCert.VerifyHostname(certName); err != nil {
- // Incorrect certificate name is something the user most
- // likely wants to know about, since it's an advanced
- // config. Warn instead of Info.
- l.Warnf("Bad certificate from %s at %s: %v", remoteID, c, err)
- c.Close()
- continue
- }
- // Wrap the connection in rate limiters. The limiter itself will
- // keep up with config changes to the rate and whether or not LAN
- // connections are limited.
- isLAN := s.isLAN(c.RemoteAddr())
- rd, wr := s.limiter.getLimiters(remoteID, c, isLAN)
- protoConn := protocol.NewConnection(remoteID, rd, wr, c, s.model, c, deviceCfg.Compression, s.cfg.FolderPasswords(remoteID))
- go func() {
- <-protoConn.Closed()
- s.dialNowDevicesMut.Lock()
- s.dialNowDevices[remoteID] = struct{}{}
- s.scheduleDialNow()
- s.dialNowDevicesMut.Unlock()
- }()
- l.Infof("Established secure connection to %s at %s", remoteID, c)
- s.model.AddConnection(protoConn, hello)
- continue
- }
- }
- func (s *service) connect(ctx context.Context) error {
- // Map of when to earliest dial each given device + address again
- nextDialAt := make(nextDialRegistry)
- // Used as delay for the first few connection attempts (adjusted up to
- // minConnectionLoopSleep), increased exponentially until it reaches
- // stdConnectionLoopSleep, at which time the normal sleep mechanism
- // kicks in.
- initialRampup := time.Second
- for {
- cfg := s.cfg.RawCopy()
- bestDialerPriority := s.bestDialerPriority(cfg)
- isInitialRampup := initialRampup < stdConnectionLoopSleep
- l.Debugln("Connection loop")
- if isInitialRampup {
- l.Debugln("Connection loop in initial rampup")
- }
- // Used for consistency throughout this loop run, as time passes
- // while we try connections etc.
- now := time.Now()
- // Attempt to dial all devices that are unconnected or can be connection-upgraded
- s.dialDevices(ctx, now, cfg, bestDialerPriority, nextDialAt, isInitialRampup)
- var sleep time.Duration
- if isInitialRampup {
- // We are in the initial rampup time, so we slowly, statically
- // increase the sleep time.
- sleep = initialRampup
- initialRampup *= 2
- } else {
- // The sleep time is until the next dial scheduled in nextDialAt,
- // clamped by stdConnectionLoopSleep as we don't want to sleep too
- // long (config changes might happen).
- sleep = nextDialAt.sleepDurationAndCleanup(now)
- }
- // ... while making sure not to loop too quickly either.
- if sleep < minConnectionLoopSleep {
- sleep = minConnectionLoopSleep
- }
- l.Debugln("Next connection loop in", sleep)
- timeout := time.NewTimer(sleep)
- select {
- case <-s.dialNow:
- // Remove affected devices from nextDialAt to dial immediately,
- // regardless of when we last dialed it (there's cool down in the
- // registry for too many repeat dials).
- s.dialNowDevicesMut.Lock()
- for device := range s.dialNowDevices {
- nextDialAt.redialDevice(device, now)
- }
- s.dialNowDevices = make(map[protocol.DeviceID]struct{})
- s.dialNowDevicesMut.Unlock()
- timeout.Stop()
- case <-timeout.C:
- case <-ctx.Done():
- return ctx.Err()
- }
- }
- }
- func (*service) bestDialerPriority(cfg config.Configuration) int {
- bestDialerPriority := worstDialerPriority
- for _, df := range dialers {
- if df.Valid(cfg) != nil {
- continue
- }
- if prio := df.Priority(); prio < bestDialerPriority {
- bestDialerPriority = prio
- }
- }
- return bestDialerPriority
- }
- func (s *service) dialDevices(ctx context.Context, now time.Time, cfg config.Configuration, bestDialerPriority int, nextDialAt nextDialRegistry, initial bool) {
- // Figure out current connection limits up front to see if there's any
- // point in resolving devices and such at all.
- allowAdditional := 0 // no limit
- connectionLimit := cfg.Options.LowestConnectionLimit()
- if connectionLimit > 0 {
- current := s.model.NumConnections()
- allowAdditional = connectionLimit - current
- if allowAdditional <= 0 {
- l.Debugf("Skipping dial because we've reached the connection limit, current %d >= limit %d", current, connectionLimit)
- return
- }
- }
- // Get device statistics for the last seen time of each device. This
- // isn't critical, so ignore the potential error.
- stats, _ := s.model.DeviceStatistics()
- queue := make(dialQueue, 0, len(cfg.Devices))
- for _, deviceCfg := range cfg.Devices {
- // Don't attempt to connect to ourselves...
- if deviceCfg.DeviceID == s.myID {
- continue
- }
- // Don't attempt to connect to paused devices...
- if deviceCfg.Paused {
- continue
- }
- // See if we are already connected and, if so, what our cutoff is
- // for dialer priority.
- priorityCutoff := worstDialerPriority
- connection, connected := s.model.Connection(deviceCfg.DeviceID)
- if connected {
- priorityCutoff = connection.Priority()
- if bestDialerPriority >= priorityCutoff {
- // Our best dialer is not any better than what we already
- // have, so nothing to do here.
- continue
- }
- }
- dialTargets := s.resolveDialTargets(ctx, now, cfg, deviceCfg, nextDialAt, initial, priorityCutoff)
- if len(dialTargets) > 0 {
- queue = append(queue, dialQueueEntry{
- id: deviceCfg.DeviceID,
- lastSeen: stats[deviceCfg.DeviceID].LastSeen,
- shortLived: stats[deviceCfg.DeviceID].LastConnectionDurationS < shortLivedConnectionThreshold.Seconds(),
- targets: dialTargets,
- })
- }
- }
- // Sort the queue in an order we think will be useful (most recent
- // first, deprioriting unstable devices, randomizing those we haven't
- // seen in a long while). If we don't do connection limiting the sorting
- // doesn't have much effect, but it may result in getting up and running
- // quicker if only a subset of configured devices are actually reachable
- // (by prioritizing those that were reachable recently).
- queue.Sort()
- // Perform dials according to the queue, stopping when we've reached the
- // allowed additional number of connections (if limited).
- numConns := 0
- var numConnsMut stdsync.Mutex
- dialSemaphore := util.NewSemaphore(dialMaxParallel)
- dialWG := new(stdsync.WaitGroup)
- dialCtx, dialCancel := context.WithCancel(ctx)
- defer func() {
- dialWG.Wait()
- dialCancel()
- }()
- for i := range queue {
- select {
- case <-dialCtx.Done():
- return
- default:
- }
- dialWG.Add(1)
- go func(entry dialQueueEntry) {
- defer dialWG.Done()
- conn, ok := s.dialParallel(dialCtx, entry.id, entry.targets, dialSemaphore)
- if !ok {
- return
- }
- numConnsMut.Lock()
- if allowAdditional == 0 || numConns < allowAdditional {
- select {
- case s.conns <- conn:
- numConns++
- if allowAdditional > 0 && numConns >= allowAdditional {
- dialCancel()
- }
- case <-dialCtx.Done():
- }
- }
- numConnsMut.Unlock()
- }(queue[i])
- }
- }
- func (s *service) resolveDialTargets(ctx context.Context, now time.Time, cfg config.Configuration, deviceCfg config.DeviceConfiguration, nextDialAt nextDialRegistry, initial bool, priorityCutoff int) []dialTarget {
- deviceID := deviceCfg.DeviceID
- addrs := s.resolveDeviceAddrs(ctx, deviceCfg)
- l.Debugln("Resolved device", deviceID, "addresses:", addrs)
- dialTargets := make([]dialTarget, 0, len(addrs))
- for _, addr := range addrs {
- // Use both device and address, as you might have two devices connected
- // to the same relay
- if !initial && nextDialAt.get(deviceID, addr).After(now) {
- l.Debugf("Not dialing %s via %v as it's not time yet", deviceID, addr)
- continue
- }
- // If we fail at any step before actually getting the dialer
- // retry in a minute
- nextDialAt.set(deviceID, addr, now.Add(time.Minute))
- uri, err := url.Parse(addr)
- if err != nil {
- s.setConnectionStatus(addr, err)
- l.Infof("Parsing dialer address %s: %v", addr, err)
- continue
- }
- if len(deviceCfg.AllowedNetworks) > 0 {
- if !IsAllowedNetwork(uri.Host, deviceCfg.AllowedNetworks) {
- s.setConnectionStatus(addr, errors.New("network disallowed"))
- l.Debugln("Network for", uri, "is disallowed")
- continue
- }
- }
- dialerFactory, err := getDialerFactory(cfg, uri)
- if err != nil {
- s.setConnectionStatus(addr, err)
- }
- if errors.Is(err, errUnsupported) {
- l.Debugf("Dialer for %v: %v", uri, err)
- continue
- } else if err != nil {
- l.Infof("Dialer for %v: %v", uri, err)
- continue
- }
- priority := dialerFactory.Priority()
- if priority >= priorityCutoff {
- l.Debugf("Not dialing using %s as priority is not better than current connection (%d >= %d)", dialerFactory, dialerFactory.Priority(), priorityCutoff)
- continue
- }
- dialer := dialerFactory.New(s.cfg.Options(), s.tlsCfg, s.registry)
- nextDialAt.set(deviceID, addr, now.Add(dialer.RedialFrequency()))
- // For LAN addresses, increase the priority so that we
- // try these first.
- switch {
- case dialerFactory.AlwaysWAN():
- // Do nothing.
- case s.isLANHost(uri.Host):
- priority--
- }
- dialTargets = append(dialTargets, dialTarget{
- addr: addr,
- dialer: dialer,
- priority: priority,
- deviceID: deviceID,
- uri: uri,
- })
- }
- return dialTargets
- }
- func (s *service) resolveDeviceAddrs(ctx context.Context, cfg config.DeviceConfiguration) []string {
- var addrs []string
- for _, addr := range cfg.Addresses {
- if addr == "dynamic" {
- if s.discoverer != nil {
- if t, err := s.discoverer.Lookup(ctx, cfg.DeviceID); err == nil {
- addrs = append(addrs, t...)
- }
- }
- } else {
- addrs = append(addrs, addr)
- }
- }
- return util.UniqueTrimmedStrings(addrs)
- }
- func (s *service) isLANHost(host string) bool {
- // Probably we are called with an ip:port combo which we can resolve as
- // a TCP address.
- if addr, err := net.ResolveTCPAddr("tcp", host); err == nil {
- return s.isLAN(addr)
- }
- // ... but this function looks general enough that someone might try
- // with just an IP as well in the future so lets allow that.
- if addr, err := net.ResolveIPAddr("ip", host); err == nil {
- return s.isLAN(addr)
- }
- return false
- }
- func (s *service) isLAN(addr net.Addr) bool {
- var ip net.IP
- switch addr := addr.(type) {
- case *net.IPAddr:
- ip = addr.IP
- case *net.TCPAddr:
- ip = addr.IP
- case *net.UDPAddr:
- ip = addr.IP
- default:
- // From the standard library, just Unix sockets.
- // If you invent your own, handle it.
- return false
- }
- if ip.IsLoopback() {
- return true
- }
- for _, lan := range s.cfg.Options().AlwaysLocalNets {
- _, ipnet, err := net.ParseCIDR(lan)
- if err != nil {
- l.Debugln("Network", lan, "is malformed:", err)
- continue
- }
- if ipnet.Contains(ip) {
- return true
- }
- }
- lans, _ := osutil.GetLans()
- for _, lan := range lans {
- if lan.Contains(ip) {
- return true
- }
- }
- return false
- }
- func (s *service) createListener(factory listenerFactory, uri *url.URL) bool {
- // must be called with listenerMut held
- l.Debugln("Starting listener", uri)
- listener := factory.New(uri, s.cfg, s.tlsCfg, s.conns, s.natService, s.registry)
- listener.OnAddressesChanged(s.logListenAddressesChangedEvent)
- // Retrying a listener many times in rapid succession is unlikely to help,
- // thus back off quickly. A listener may soon be functional again, e.g. due
- // to a network interface coming back online - retry every minute.
- spec := svcutil.SpecWithInfoLogger(l)
- spec.FailureThreshold = 2
- spec.FailureBackoff = time.Minute
- sup := suture.New(fmt.Sprintf("listenerSupervisor@%v", listener), spec)
- sup.Add(listener)
- s.listeners[uri.String()] = listener
- s.listenerTokens[uri.String()] = s.Add(sup)
- return true
- }
- func (s *service) logListenAddressesChangedEvent(l ListenerAddresses) {
- s.evLogger.Log(events.ListenAddressesChanged, map[string]interface{}{
- "address": l.URI,
- "lan": l.LANAddresses,
- "wan": l.WANAddresses,
- })
- }
- func (s *service) CommitConfiguration(from, to config.Configuration) bool {
- newDevices := make(map[protocol.DeviceID]bool, len(to.Devices))
- for _, dev := range to.Devices {
- newDevices[dev.DeviceID] = true
- }
- for _, dev := range from.Devices {
- if !newDevices[dev.DeviceID] {
- warningLimitersMut.Lock()
- delete(warningLimiters, dev.DeviceID)
- warningLimitersMut.Unlock()
- }
- }
- s.checkAndSignalConnectLoopOnUpdatedDevices(from, to)
- s.listenersMut.Lock()
- seen := make(map[string]struct{})
- for _, addr := range to.Options.ListenAddresses() {
- if addr == "" {
- // We can get an empty address if there is an empty listener
- // element in the config, indicating no listeners should be
- // used. This is not an error.
- continue
- }
- uri, err := url.Parse(addr)
- if err != nil {
- l.Warnf("Skipping malformed listener URL %q: %v", addr, err)
- continue
- }
- // Make sure we always have the canonical representation of the URL.
- // This is for consistency as we use it as a map key, but also to
- // avoid misunderstandings. We do not just use the canonicalized
- // version, because an URL that looks very similar to a human might
- // mean something entirely different to the computer (e.g.,
- // tcp:/127.0.0.1:22000 in fact being equivalent to tcp://:22000).
- if canonical := uri.String(); canonical != addr {
- l.Warnf("Skipping malformed listener URL %q (not canonical)", addr)
- continue
- }
- if _, ok := s.listeners[addr]; ok {
- seen[addr] = struct{}{}
- continue
- }
- factory, err := getListenerFactory(to, uri)
- if errors.Is(err, errUnsupported) {
- l.Debugf("Listener for %v: %v", uri, err)
- continue
- } else if err != nil {
- l.Infof("Listener for %v: %v", uri, err)
- continue
- }
- s.createListener(factory, uri)
- seen[addr] = struct{}{}
- }
- for addr, listener := range s.listeners {
- if _, ok := seen[addr]; !ok || listener.Factory().Valid(to) != nil {
- l.Debugln("Stopping listener", addr)
- s.Remove(s.listenerTokens[addr])
- delete(s.listenerTokens, addr)
- delete(s.listeners, addr)
- }
- }
- s.listenersMut.Unlock()
- return true
- }
- func (s *service) checkAndSignalConnectLoopOnUpdatedDevices(from, to config.Configuration) {
- oldDevices := from.DeviceMap()
- dial := false
- s.dialNowDevicesMut.Lock()
- for _, dev := range to.Devices {
- if dev.Paused {
- continue
- }
- if oldDev, ok := oldDevices[dev.DeviceID]; !ok || oldDev.Paused {
- s.dialNowDevices[dev.DeviceID] = struct{}{}
- dial = true
- } else if !util.EqualStrings(oldDev.Addresses, dev.Addresses) {
- dial = true
- }
- }
- if dial {
- s.scheduleDialNow()
- }
- s.dialNowDevicesMut.Unlock()
- }
- func (s *service) scheduleDialNow() {
- select {
- case s.dialNow <- struct{}{}:
- default:
- // channel is blocked - a config update is already pending for the connection loop.
- }
- }
- func (s *service) AllAddresses() []string {
- s.listenersMut.RLock()
- var addrs []string
- for _, listener := range s.listeners {
- for _, lanAddr := range listener.LANAddresses() {
- addrs = append(addrs, lanAddr.String())
- }
- for _, wanAddr := range listener.WANAddresses() {
- addrs = append(addrs, wanAddr.String())
- }
- }
- s.listenersMut.RUnlock()
- return util.UniqueTrimmedStrings(addrs)
- }
- func (s *service) ExternalAddresses() []string {
- if s.cfg.Options().AnnounceLANAddresses {
- return s.AllAddresses()
- }
- s.listenersMut.RLock()
- var addrs []string
- for _, listener := range s.listeners {
- for _, wanAddr := range listener.WANAddresses() {
- addrs = append(addrs, wanAddr.String())
- }
- }
- s.listenersMut.RUnlock()
- return util.UniqueTrimmedStrings(addrs)
- }
- func (s *service) ListenerStatus() map[string]ListenerStatusEntry {
- result := make(map[string]ListenerStatusEntry)
- s.listenersMut.RLock()
- for addr, listener := range s.listeners {
- var status ListenerStatusEntry
- if err := listener.Error(); err != nil {
- errStr := err.Error()
- status.Error = &errStr
- }
- status.LANAddresses = urlsToStrings(listener.LANAddresses())
- status.WANAddresses = urlsToStrings(listener.WANAddresses())
- result[addr] = status
- }
- s.listenersMut.RUnlock()
- return result
- }
- type connectionStatusHandler struct {
- connectionStatusMut sync.RWMutex
- connectionStatus map[string]ConnectionStatusEntry // address -> latest error/status
- }
- func newConnectionStatusHandler() connectionStatusHandler {
- return connectionStatusHandler{
- connectionStatusMut: sync.NewRWMutex(),
- connectionStatus: make(map[string]ConnectionStatusEntry),
- }
- }
- func (s *connectionStatusHandler) ConnectionStatus() map[string]ConnectionStatusEntry {
- result := make(map[string]ConnectionStatusEntry)
- s.connectionStatusMut.RLock()
- for k, v := range s.connectionStatus {
- result[k] = v
- }
- s.connectionStatusMut.RUnlock()
- return result
- }
- func (s *connectionStatusHandler) setConnectionStatus(address string, err error) {
- if errors.Is(err, context.Canceled) {
- return
- }
- status := ConnectionStatusEntry{When: time.Now().UTC().Truncate(time.Second)}
- if err != nil {
- errStr := err.Error()
- status.Error = &errStr
- }
- s.connectionStatusMut.Lock()
- s.connectionStatus[address] = status
- s.connectionStatusMut.Unlock()
- }
- func (s *service) NATType() string {
- s.listenersMut.RLock()
- defer s.listenersMut.RUnlock()
- for _, listener := range s.listeners {
- natType := listener.NATType()
- if natType != "unknown" {
- return natType
- }
- }
- return "unknown"
- }
- func getDialerFactory(cfg config.Configuration, uri *url.URL) (dialerFactory, error) {
- dialerFactory, ok := dialers[uri.Scheme]
- if !ok {
- return nil, fmt.Errorf("unknown address scheme %q", uri.Scheme)
- }
- if err := dialerFactory.Valid(cfg); err != nil {
- return nil, err
- }
- return dialerFactory, nil
- }
- func getListenerFactory(cfg config.Configuration, uri *url.URL) (listenerFactory, error) {
- listenerFactory, ok := listeners[uri.Scheme]
- if !ok {
- return nil, fmt.Errorf("unknown address scheme %q", uri.Scheme)
- }
- if err := listenerFactory.Valid(cfg); err != nil {
- return nil, err
- }
- return listenerFactory, nil
- }
- func urlsToStrings(urls []*url.URL) []string {
- strings := make([]string, len(urls))
- for i, url := range urls {
- strings[i] = url.String()
- }
- return strings
- }
- var warningLimiters = make(map[protocol.DeviceID]*rate.Limiter)
- var warningLimitersMut = sync.NewMutex()
- func warningFor(dev protocol.DeviceID, msg string) {
- warningLimitersMut.Lock()
- defer warningLimitersMut.Unlock()
- lim, ok := warningLimiters[dev]
- if !ok {
- lim = rate.NewLimiter(rate.Every(perDeviceWarningIntv), 1)
- warningLimiters[dev] = lim
- }
- if lim.Allow() {
- l.Warnln(msg)
- }
- }
- func tlsTimedHandshake(tc *tls.Conn) error {
- tc.SetDeadline(time.Now().Add(tlsHandshakeTimeout))
- defer tc.SetDeadline(time.Time{})
- return tc.Handshake()
- }
- // IsAllowedNetwork returns true if the given host (IP or resolvable
- // hostname) is in the set of allowed networks (CIDR format only).
- func IsAllowedNetwork(host string, allowed []string) bool {
- if hostNoPort, _, err := net.SplitHostPort(host); err == nil {
- host = hostNoPort
- }
- addr, err := net.ResolveIPAddr("ip", host)
- if err != nil {
- return false
- }
- for _, n := range allowed {
- result := true
- if strings.HasPrefix(n, "!") {
- result = false
- n = n[1:]
- }
- _, cidr, err := net.ParseCIDR(n)
- if err != nil {
- continue
- }
- if cidr.Contains(addr.IP) {
- return result
- }
- }
- return false
- }
- func (s *service) dialParallel(ctx context.Context, deviceID protocol.DeviceID, dialTargets []dialTarget, parentSema *util.Semaphore) (internalConn, bool) {
- // Group targets into buckets by priority
- dialTargetBuckets := make(map[int][]dialTarget, len(dialTargets))
- for _, tgt := range dialTargets {
- dialTargetBuckets[tgt.priority] = append(dialTargetBuckets[tgt.priority], tgt)
- }
- // Get all available priorities
- priorities := make([]int, 0, len(dialTargetBuckets))
- for prio := range dialTargetBuckets {
- priorities = append(priorities, prio)
- }
- // Sort the priorities so that we dial lowest first (which means highest...)
- sort.Ints(priorities)
- sema := util.MultiSemaphore{util.NewSemaphore(dialMaxParallelPerDevice), parentSema}
- for _, prio := range priorities {
- tgts := dialTargetBuckets[prio]
- res := make(chan internalConn, len(tgts))
- wg := stdsync.WaitGroup{}
- for _, tgt := range tgts {
- sema.Take(1)
- wg.Add(1)
- go func(tgt dialTarget) {
- defer func() {
- wg.Done()
- sema.Give(1)
- }()
- conn, err := tgt.Dial(ctx)
- if err == nil {
- // Closes the connection on error
- err = s.validateIdentity(conn, deviceID)
- }
- s.setConnectionStatus(tgt.addr, err)
- if err != nil {
- l.Debugln("dialing", deviceID, tgt.uri, "error:", err)
- } else {
- l.Debugln("dialing", deviceID, tgt.uri, "success:", conn)
- res <- conn
- }
- }(tgt)
- }
- // Spawn a routine which will unblock main routine in case we fail
- // to connect to anyone.
- go func() {
- wg.Wait()
- close(res)
- }()
- // Wait for the first connection, or for channel closure.
- if conn, ok := <-res; ok {
- // Got a connection, means more might come back, hence spawn a
- // routine that will do the discarding.
- l.Debugln("connected to", deviceID, prio, "using", conn, conn.priority)
- go func(deviceID protocol.DeviceID, prio int) {
- wg.Wait()
- l.Debugln("discarding", len(res), "connections while connecting to", deviceID, prio)
- for conn := range res {
- conn.Close()
- }
- }(deviceID, prio)
- return conn, ok
- }
- // Failed to connect, report that fact.
- l.Debugln("failed to connect to", deviceID, prio)
- }
- return internalConn{}, false
- }
- func (s *service) validateIdentity(c internalConn, expectedID protocol.DeviceID) error {
- cs := c.ConnectionState()
- // We should have received exactly one certificate from the other
- // side. If we didn't, they don't have a device ID and we drop the
- // connection.
- certs := cs.PeerCertificates
- if cl := len(certs); cl != 1 {
- l.Infof("Got peer certificate list of length %d != 1 from peer at %s; protocol error", cl, c)
- c.Close()
- return fmt.Errorf("expected 1 certificate, got %d", cl)
- }
- remoteCert := certs[0]
- remoteID := protocol.NewDeviceID(remoteCert.Raw)
- // The device ID should not be that of ourselves. It can happen
- // though, especially in the presence of NAT hairpinning, multiple
- // clients between the same NAT gateway, and global discovery.
- if remoteID == s.myID {
- l.Debugf("Connected to myself (%s) at %s", remoteID, c)
- c.Close()
- return errors.New("connected to self")
- }
- // We should see the expected device ID
- if !remoteID.Equals(expectedID) {
- c.Close()
- return fmt.Errorf("unexpected device id, expected %s got %s", expectedID, remoteID)
- }
- return nil
- }
- type nextDialRegistry map[protocol.DeviceID]nextDialDevice
- type nextDialDevice struct {
- nextDial map[string]time.Time
- coolDownIntervalStart time.Time
- attempts int
- }
- func (r nextDialRegistry) get(device protocol.DeviceID, addr string) time.Time {
- return r[device].nextDial[addr]
- }
- const (
- dialCoolDownInterval = 2 * time.Minute
- dialCoolDownDelay = 5 * time.Minute
- dialCoolDownMaxAttemps = 3
- )
- // redialDevice marks the device for immediate redial, unless the remote keeps
- // dropping established connections. Thus we keep track of when the first forced
- // re-dial happened, and how many attempts happen in the dialCoolDownInterval
- // after that. If it's more than dialCoolDownMaxAttempts, don't force-redial
- // that device for dialCoolDownDelay (regular dials still happen).
- func (r nextDialRegistry) redialDevice(device protocol.DeviceID, now time.Time) {
- dev, ok := r[device]
- if !ok {
- r[device] = nextDialDevice{
- nextDial: make(map[string]time.Time),
- coolDownIntervalStart: now,
- attempts: 1,
- }
- return
- }
- if dev.attempts == 0 || now.Before(dev.coolDownIntervalStart.Add(dialCoolDownInterval)) {
- if dev.attempts >= dialCoolDownMaxAttemps {
- // Device has been force redialed too often - let it cool down.
- return
- }
- if dev.attempts == 0 {
- dev.coolDownIntervalStart = now
- }
- dev.attempts++
- dev.nextDial = make(map[string]time.Time)
- return
- }
- if dev.attempts >= dialCoolDownMaxAttemps && now.Before(dev.coolDownIntervalStart.Add(dialCoolDownDelay)) {
- return // Still cooling down
- }
- delete(r, device)
- }
- func (r nextDialRegistry) set(device protocol.DeviceID, addr string, next time.Time) {
- if _, ok := r[device]; !ok {
- r[device] = nextDialDevice{nextDial: make(map[string]time.Time)}
- }
- r[device].nextDial[addr] = next
- }
- func (r nextDialRegistry) sleepDurationAndCleanup(now time.Time) time.Duration {
- sleep := stdConnectionLoopSleep
- for id, dev := range r {
- for address, next := range dev.nextDial {
- if next.Before(now) {
- // Expired entry, address was not seen in last pass(es)
- delete(dev.nextDial, address)
- continue
- }
- if cur := next.Sub(now); cur < sleep {
- sleep = cur
- }
- }
- if dev.attempts > 0 {
- interval := dialCoolDownInterval
- if dev.attempts >= dialCoolDownMaxAttemps {
- interval = dialCoolDownDelay
- }
- if now.After(dev.coolDownIntervalStart.Add(interval)) {
- dev.attempts = 0
- }
- }
- if len(dev.nextDial) == 0 && dev.attempts == 0 {
- delete(r, id)
- }
- }
- return sleep
- }
|