database.go 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460
  1. // Copyright (C) 2018 The Syncthing Authors.
  2. //
  3. // This Source Code Form is subject to the terms of the Mozilla Public
  4. // License, v. 2.0. If a copy of the MPL was not distributed with this file,
  5. // You can obtain one at https://mozilla.org/MPL/2.0/.
  6. //go:generate go run ../../proto/scripts/protofmt.go database.proto
  7. //go:generate protoc -I ../../ -I . --gogofast_out=. database.proto
  8. package main
  9. import (
  10. "bufio"
  11. "cmp"
  12. "context"
  13. "encoding/binary"
  14. "io"
  15. "log"
  16. "net"
  17. "net/url"
  18. "os"
  19. "path"
  20. "slices"
  21. "time"
  22. "github.com/aws/aws-sdk-go/aws"
  23. "github.com/aws/aws-sdk-go/aws/session"
  24. "github.com/aws/aws-sdk-go/service/s3"
  25. "github.com/aws/aws-sdk-go/service/s3/s3manager"
  26. "github.com/puzpuzpuz/xsync/v3"
  27. "github.com/syncthing/syncthing/lib/protocol"
  28. )
  29. type clock interface {
  30. Now() time.Time
  31. }
  32. type defaultClock struct{}
  33. func (defaultClock) Now() time.Time {
  34. return time.Now()
  35. }
  36. type database interface {
  37. put(key *protocol.DeviceID, rec DatabaseRecord) error
  38. merge(key *protocol.DeviceID, addrs []DatabaseAddress, seen int64) error
  39. get(key *protocol.DeviceID) (DatabaseRecord, error)
  40. }
  41. type inMemoryStore struct {
  42. m *xsync.MapOf[protocol.DeviceID, DatabaseRecord]
  43. dir string
  44. flushInterval time.Duration
  45. clock clock
  46. }
  47. func newInMemoryStore(dir string, flushInterval time.Duration) *inMemoryStore {
  48. s := &inMemoryStore{
  49. m: xsync.NewMapOf[protocol.DeviceID, DatabaseRecord](),
  50. dir: dir,
  51. flushInterval: flushInterval,
  52. clock: defaultClock{},
  53. }
  54. err := s.read()
  55. if os.IsNotExist(err) {
  56. // Try to read from AWS
  57. fd, cerr := os.Create(path.Join(s.dir, "records.db"))
  58. if cerr != nil {
  59. log.Println("Error creating database file:", err)
  60. return s
  61. }
  62. if err := s3Download(fd); err != nil {
  63. log.Printf("Error reading database from S3: %v", err)
  64. }
  65. _ = fd.Close()
  66. err = s.read()
  67. }
  68. if err != nil {
  69. log.Println("Error reading database:", err)
  70. }
  71. s.calculateStatistics()
  72. return s
  73. }
  74. func (s *inMemoryStore) put(key *protocol.DeviceID, rec DatabaseRecord) error {
  75. t0 := time.Now()
  76. s.m.Store(*key, rec)
  77. databaseOperations.WithLabelValues(dbOpPut, dbResSuccess).Inc()
  78. databaseOperationSeconds.WithLabelValues(dbOpPut).Observe(time.Since(t0).Seconds())
  79. return nil
  80. }
  81. func (s *inMemoryStore) merge(key *protocol.DeviceID, addrs []DatabaseAddress, seen int64) error {
  82. t0 := time.Now()
  83. newRec := DatabaseRecord{
  84. Addresses: addrs,
  85. Seen: seen,
  86. }
  87. oldRec, _ := s.m.Load(*key)
  88. newRec = merge(newRec, oldRec)
  89. s.m.Store(*key, newRec)
  90. databaseOperations.WithLabelValues(dbOpMerge, dbResSuccess).Inc()
  91. databaseOperationSeconds.WithLabelValues(dbOpMerge).Observe(time.Since(t0).Seconds())
  92. return nil
  93. }
  94. func (s *inMemoryStore) get(key *protocol.DeviceID) (DatabaseRecord, error) {
  95. t0 := time.Now()
  96. defer func() {
  97. databaseOperationSeconds.WithLabelValues(dbOpGet).Observe(time.Since(t0).Seconds())
  98. }()
  99. rec, ok := s.m.Load(*key)
  100. if !ok {
  101. databaseOperations.WithLabelValues(dbOpGet, dbResNotFound).Inc()
  102. return DatabaseRecord{}, nil
  103. }
  104. rec.Addresses = expire(rec.Addresses, s.clock.Now().UnixNano())
  105. databaseOperations.WithLabelValues(dbOpGet, dbResSuccess).Inc()
  106. return rec, nil
  107. }
  108. func (s *inMemoryStore) Serve(ctx context.Context) error {
  109. t := time.NewTimer(s.flushInterval)
  110. defer t.Stop()
  111. if s.flushInterval <= 0 {
  112. t.Stop()
  113. }
  114. loop:
  115. for {
  116. select {
  117. case <-t.C:
  118. if err := s.write(); err != nil {
  119. log.Println("Error writing database:", err)
  120. }
  121. s.calculateStatistics()
  122. t.Reset(s.flushInterval)
  123. case <-ctx.Done():
  124. // We're done.
  125. break loop
  126. }
  127. }
  128. return s.write()
  129. }
  130. func (s *inMemoryStore) calculateStatistics() {
  131. t0 := time.Now()
  132. nowNanos := t0.UnixNano()
  133. cutoff24h := t0.Add(-24 * time.Hour).UnixNano()
  134. cutoff1w := t0.Add(-7 * 24 * time.Hour).UnixNano()
  135. current, currentIPv4, currentIPv6, last24h, last1w, errors := 0, 0, 0, 0, 0, 0
  136. s.m.Range(func(key protocol.DeviceID, rec DatabaseRecord) bool {
  137. // If there are addresses that have not expired it's a current
  138. // record, otherwise account it based on when it was last seen
  139. // (last 24 hours or last week) or finally as inactice.
  140. addrs := expire(rec.Addresses, nowNanos)
  141. switch {
  142. case len(addrs) > 0:
  143. current++
  144. seenIPv4, seenIPv6 := false, false
  145. for _, addr := range addrs {
  146. uri, err := url.Parse(addr.Address)
  147. if err != nil {
  148. continue
  149. }
  150. host, _, err := net.SplitHostPort(uri.Host)
  151. if err != nil {
  152. continue
  153. }
  154. if ip := net.ParseIP(host); ip != nil && ip.To4() != nil {
  155. seenIPv4 = true
  156. } else if ip != nil {
  157. seenIPv6 = true
  158. }
  159. if seenIPv4 && seenIPv6 {
  160. break
  161. }
  162. }
  163. if seenIPv4 {
  164. currentIPv4++
  165. }
  166. if seenIPv6 {
  167. currentIPv6++
  168. }
  169. case rec.Seen > cutoff24h:
  170. last24h++
  171. case rec.Seen > cutoff1w:
  172. last1w++
  173. default:
  174. // drop the record if it's older than a week
  175. s.m.Delete(key)
  176. }
  177. return true
  178. })
  179. databaseKeys.WithLabelValues("current").Set(float64(current))
  180. databaseKeys.WithLabelValues("currentIPv4").Set(float64(currentIPv4))
  181. databaseKeys.WithLabelValues("currentIPv6").Set(float64(currentIPv6))
  182. databaseKeys.WithLabelValues("last24h").Set(float64(last24h))
  183. databaseKeys.WithLabelValues("last1w").Set(float64(last1w))
  184. databaseKeys.WithLabelValues("error").Set(float64(errors))
  185. databaseStatisticsSeconds.Set(time.Since(t0).Seconds())
  186. }
  187. func (s *inMemoryStore) write() (err error) {
  188. t0 := time.Now()
  189. defer func() {
  190. if err == nil {
  191. databaseWriteSeconds.Set(time.Since(t0).Seconds())
  192. databaseLastWritten.Set(float64(t0.Unix()))
  193. }
  194. }()
  195. dbf := path.Join(s.dir, "records.db")
  196. fd, err := os.Create(dbf + ".tmp")
  197. if err != nil {
  198. return err
  199. }
  200. bw := bufio.NewWriter(fd)
  201. var buf []byte
  202. var rangeErr error
  203. now := s.clock.Now().UnixNano()
  204. cutoff1w := s.clock.Now().Add(-7 * 24 * time.Hour).UnixNano()
  205. s.m.Range(func(key protocol.DeviceID, value DatabaseRecord) bool {
  206. if value.Seen < cutoff1w {
  207. // drop the record if it's older than a week
  208. return true
  209. }
  210. rec := ReplicationRecord{
  211. Key: key[:],
  212. Addresses: expire(value.Addresses, now),
  213. Seen: value.Seen,
  214. }
  215. s := rec.Size()
  216. if s+4 > len(buf) {
  217. buf = make([]byte, s+4)
  218. }
  219. n, err := rec.MarshalTo(buf[4:])
  220. if err != nil {
  221. rangeErr = err
  222. return false
  223. }
  224. binary.BigEndian.PutUint32(buf, uint32(n))
  225. if _, err := bw.Write(buf[:n+4]); err != nil {
  226. rangeErr = err
  227. return false
  228. }
  229. return true
  230. })
  231. if rangeErr != nil {
  232. _ = fd.Close()
  233. return rangeErr
  234. }
  235. if err := bw.Flush(); err != nil {
  236. _ = fd.Close
  237. return err
  238. }
  239. if err := fd.Close(); err != nil {
  240. return err
  241. }
  242. if err := os.Rename(dbf+".tmp", dbf); err != nil {
  243. return err
  244. }
  245. if os.Getenv("PODINDEX") == "0" {
  246. // Upload to S3
  247. fd, err = os.Open(dbf)
  248. if err != nil {
  249. log.Printf("Error uploading database to S3: %v", err)
  250. return nil
  251. }
  252. defer fd.Close()
  253. if err := s3Upload(fd); err != nil {
  254. log.Printf("Error uploading database to S3: %v", err)
  255. }
  256. }
  257. return nil
  258. }
  259. func (s *inMemoryStore) read() error {
  260. fd, err := os.Open(path.Join(s.dir, "records.db"))
  261. if err != nil {
  262. return err
  263. }
  264. defer fd.Close()
  265. br := bufio.NewReader(fd)
  266. var buf []byte
  267. for {
  268. var n uint32
  269. if err := binary.Read(br, binary.BigEndian, &n); err != nil {
  270. if err == io.EOF {
  271. break
  272. }
  273. return err
  274. }
  275. if int(n) > len(buf) {
  276. buf = make([]byte, n)
  277. }
  278. if _, err := io.ReadFull(br, buf[:n]); err != nil {
  279. return err
  280. }
  281. rec := ReplicationRecord{}
  282. if err := rec.Unmarshal(buf[:n]); err != nil {
  283. return err
  284. }
  285. key, err := protocol.DeviceIDFromBytes(rec.Key)
  286. if err != nil {
  287. key, err = protocol.DeviceIDFromString(string(rec.Key))
  288. }
  289. if err != nil {
  290. log.Println("Bad device ID:", err)
  291. continue
  292. }
  293. slices.SortFunc(rec.Addresses, DatabaseAddress.Cmp)
  294. s.m.Store(key, DatabaseRecord{
  295. Addresses: rec.Addresses,
  296. Seen: rec.Seen,
  297. })
  298. }
  299. return nil
  300. }
  301. // merge returns the merged result of the two database records a and b. The
  302. // result is the union of the two address sets, with the newer expiry time
  303. // chosen for any duplicates.
  304. func merge(a, b DatabaseRecord) DatabaseRecord {
  305. // Both lists must be sorted for this to work.
  306. res := DatabaseRecord{
  307. Addresses: make([]DatabaseAddress, 0, max(len(a.Addresses), len(b.Addresses))),
  308. Seen: a.Seen,
  309. }
  310. if b.Seen > a.Seen {
  311. res.Seen = b.Seen
  312. }
  313. aIdx := 0
  314. bIdx := 0
  315. aAddrs := a.Addresses
  316. bAddrs := b.Addresses
  317. loop:
  318. for {
  319. switch {
  320. case aIdx == len(aAddrs) && bIdx == len(bAddrs):
  321. // both lists are exhausted, we are done
  322. break loop
  323. case aIdx == len(aAddrs):
  324. // a is exhausted, pick from b and continue
  325. res.Addresses = append(res.Addresses, bAddrs[bIdx])
  326. bIdx++
  327. continue
  328. case bIdx == len(bAddrs):
  329. // b is exhausted, pick from a and continue
  330. res.Addresses = append(res.Addresses, aAddrs[aIdx])
  331. aIdx++
  332. continue
  333. }
  334. // We have values left on both sides.
  335. aVal := aAddrs[aIdx]
  336. bVal := bAddrs[bIdx]
  337. switch {
  338. case aVal.Address == bVal.Address:
  339. // update for same address, pick newer
  340. if aVal.Expires > bVal.Expires {
  341. res.Addresses = append(res.Addresses, aVal)
  342. } else {
  343. res.Addresses = append(res.Addresses, bVal)
  344. }
  345. aIdx++
  346. bIdx++
  347. case aVal.Address < bVal.Address:
  348. // a is smallest, pick it and continue
  349. res.Addresses = append(res.Addresses, aVal)
  350. aIdx++
  351. default:
  352. // b is smallest, pick it and continue
  353. res.Addresses = append(res.Addresses, bVal)
  354. bIdx++
  355. }
  356. }
  357. return res
  358. }
  359. // expire returns the list of addresses after removing expired entries.
  360. // Expiration happen in place, so the slice given as the parameter is
  361. // destroyed. Internal order is preserved.
  362. func expire(addrs []DatabaseAddress, now int64) []DatabaseAddress {
  363. i := 0
  364. for i < len(addrs) {
  365. if addrs[i].Expires < now {
  366. copy(addrs[i:], addrs[i+1:])
  367. addrs[len(addrs)-1] = DatabaseAddress{}
  368. addrs = addrs[:len(addrs)-1]
  369. continue
  370. }
  371. i++
  372. }
  373. return addrs
  374. }
  375. func s3Upload(r io.Reader) error {
  376. sess, err := session.NewSession(&aws.Config{
  377. Region: aws.String("fr-par"),
  378. Endpoint: aws.String("s3.fr-par.scw.cloud"),
  379. })
  380. if err != nil {
  381. return err
  382. }
  383. uploader := s3manager.NewUploader(sess)
  384. _, err = uploader.Upload(&s3manager.UploadInput{
  385. Bucket: aws.String("syncthing-discovery"),
  386. Key: aws.String("discovery.db"),
  387. Body: r,
  388. })
  389. return err
  390. }
  391. func s3Download(w io.WriterAt) error {
  392. sess, err := session.NewSession(&aws.Config{
  393. Region: aws.String("fr-par"),
  394. Endpoint: aws.String("s3.fr-par.scw.cloud"),
  395. })
  396. if err != nil {
  397. return err
  398. }
  399. downloader := s3manager.NewDownloader(sess)
  400. _, err = downloader.Download(w, &s3.GetObjectInput{
  401. Bucket: aws.String("syncthing-discovery"),
  402. Key: aws.String("discovery.db"),
  403. })
  404. return err
  405. }
  406. func (d DatabaseAddress) Cmp(other DatabaseAddress) (n int) {
  407. if c := cmp.Compare(d.Address, other.Address); c != 0 {
  408. return c
  409. }
  410. return cmp.Compare(d.Expires, other.Expires)
  411. }