puller.go 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667
  1. package model
  2. import (
  3. "bytes"
  4. "errors"
  5. "os"
  6. "path/filepath"
  7. "time"
  8. "github.com/calmh/syncthing/buffers"
  9. "github.com/calmh/syncthing/cid"
  10. "github.com/calmh/syncthing/config"
  11. "github.com/calmh/syncthing/osutil"
  12. "github.com/calmh/syncthing/protocol"
  13. "github.com/calmh/syncthing/scanner"
  14. "github.com/calmh/syncthing/versioner"
  15. )
  16. type requestResult struct {
  17. node string
  18. file scanner.File
  19. filepath string // full filepath name
  20. offset int64
  21. data []byte
  22. err error
  23. }
  24. type openFile struct {
  25. filepath string // full filepath name
  26. temp string // temporary filename
  27. availability uint64 // availability bitset
  28. file *os.File
  29. err error // error when opening or writing to file, all following operations are cancelled
  30. outstanding int // number of requests we still have outstanding
  31. done bool // we have sent all requests for this file
  32. }
  33. type activityMap map[string]int
  34. func (m activityMap) leastBusyNode(availability uint64, cm *cid.Map) string {
  35. var low int = 2<<30 - 1
  36. var selected string
  37. for _, node := range cm.Names() {
  38. id := cm.Get(node)
  39. if id == cid.LocalID {
  40. continue
  41. }
  42. usage := m[node]
  43. if availability&(1<<id) != 0 {
  44. if usage < low {
  45. low = usage
  46. selected = node
  47. }
  48. }
  49. }
  50. m[selected]++
  51. return selected
  52. }
  53. func (m activityMap) decrease(node string) {
  54. m[node]--
  55. }
  56. var errNoNode = errors.New("no available source node")
  57. type puller struct {
  58. cfg *config.Configuration
  59. repoCfg config.RepositoryConfiguration
  60. bq *blockQueue
  61. model *Model
  62. oustandingPerNode activityMap
  63. openFiles map[string]openFile
  64. requestSlots chan bool
  65. blocks chan bqBlock
  66. requestResults chan requestResult
  67. versioner versioner.Versioner
  68. }
  69. func newPuller(repoCfg config.RepositoryConfiguration, model *Model, slots int, cfg *config.Configuration) *puller {
  70. p := &puller{
  71. repoCfg: repoCfg,
  72. cfg: cfg,
  73. bq: newBlockQueue(),
  74. model: model,
  75. oustandingPerNode: make(activityMap),
  76. openFiles: make(map[string]openFile),
  77. requestSlots: make(chan bool, slots),
  78. blocks: make(chan bqBlock),
  79. requestResults: make(chan requestResult),
  80. }
  81. if len(repoCfg.Versioning.Type) > 0 {
  82. factory, ok := versioner.Factories[repoCfg.Versioning.Type]
  83. if !ok {
  84. l.Fatalf("Requested versioning type %q that does not exist", repoCfg.Versioning.Type)
  85. }
  86. p.versioner = factory(repoCfg.Versioning.Params)
  87. }
  88. if slots > 0 {
  89. // Read/write
  90. for i := 0; i < slots; i++ {
  91. p.requestSlots <- true
  92. }
  93. if debug {
  94. l.Debugf("starting puller; repo %q dir %q slots %d", repoCfg.ID, repoCfg.Directory, slots)
  95. }
  96. go p.run()
  97. } else {
  98. // Read only
  99. if debug {
  100. l.Debugf("starting puller; repo %q dir %q (read only)", repoCfg.ID, repoCfg.Directory)
  101. }
  102. go p.runRO()
  103. }
  104. return p
  105. }
  106. func (p *puller) run() {
  107. go func() {
  108. // fill blocks queue when there are free slots
  109. for {
  110. <-p.requestSlots
  111. b := p.bq.get()
  112. if debug {
  113. l.Debugf("filler: queueing %q / %q offset %d copy %d", p.repoCfg.ID, b.file.Name, b.block.Offset, len(b.copy))
  114. }
  115. p.blocks <- b
  116. }
  117. }()
  118. walkTicker := time.Tick(time.Duration(p.cfg.Options.RescanIntervalS) * time.Second)
  119. timeout := time.Tick(5 * time.Second)
  120. changed := true
  121. for {
  122. // Run the pulling loop as long as there are blocks to fetch
  123. pull:
  124. for {
  125. select {
  126. case res := <-p.requestResults:
  127. p.model.setState(p.repoCfg.ID, RepoSyncing)
  128. changed = true
  129. p.requestSlots <- true
  130. p.handleRequestResult(res)
  131. case b := <-p.blocks:
  132. p.model.setState(p.repoCfg.ID, RepoSyncing)
  133. changed = true
  134. if p.handleBlock(b) {
  135. // Block was fully handled, free up the slot
  136. p.requestSlots <- true
  137. }
  138. case <-timeout:
  139. if len(p.openFiles) == 0 && p.bq.empty() {
  140. // Nothing more to do for the moment
  141. break pull
  142. }
  143. if debug {
  144. l.Debugf("%q: idle but have %d open files", p.repoCfg.ID, len(p.openFiles))
  145. i := 5
  146. for _, f := range p.openFiles {
  147. l.Debugf(" %v", f)
  148. i--
  149. if i == 0 {
  150. break
  151. }
  152. }
  153. }
  154. }
  155. }
  156. if changed {
  157. p.model.setState(p.repoCfg.ID, RepoCleaning)
  158. p.fixupDirectories()
  159. changed = false
  160. }
  161. p.model.setState(p.repoCfg.ID, RepoIdle)
  162. // Do a rescan if it's time for it
  163. select {
  164. case <-walkTicker:
  165. if debug {
  166. l.Debugf("%q: time for rescan", p.repoCfg.ID)
  167. }
  168. err := p.model.ScanRepo(p.repoCfg.ID)
  169. if err != nil {
  170. invalidateRepo(p.cfg, p.repoCfg.ID, err)
  171. return
  172. }
  173. default:
  174. }
  175. // Queue more blocks to fetch, if any
  176. p.queueNeededBlocks()
  177. }
  178. }
  179. func (p *puller) runRO() {
  180. walkTicker := time.Tick(time.Duration(p.cfg.Options.RescanIntervalS) * time.Second)
  181. for _ = range walkTicker {
  182. if debug {
  183. l.Debugf("%q: time for rescan", p.repoCfg.ID)
  184. }
  185. err := p.model.ScanRepo(p.repoCfg.ID)
  186. if err != nil {
  187. invalidateRepo(p.cfg, p.repoCfg.ID, err)
  188. return
  189. }
  190. }
  191. }
  192. func (p *puller) fixupDirectories() {
  193. var deleteDirs []string
  194. var changed = 0
  195. var walkFn = func(path string, info os.FileInfo, err error) error {
  196. if !info.IsDir() {
  197. return nil
  198. }
  199. rn, err := filepath.Rel(p.repoCfg.Directory, path)
  200. if err != nil {
  201. return nil
  202. }
  203. if rn == "." {
  204. return nil
  205. }
  206. if filepath.Base(rn) == ".stversions" {
  207. return nil
  208. }
  209. cur := p.model.CurrentRepoFile(p.repoCfg.ID, rn)
  210. if cur.Name != rn {
  211. // No matching dir in current list; weird
  212. if debug {
  213. l.Debugf("missing dir: %s; %v", rn, cur)
  214. }
  215. return nil
  216. }
  217. if protocol.IsDeleted(cur.Flags) {
  218. if debug {
  219. l.Debugf("queue delete dir: %v", cur)
  220. }
  221. // We queue the directories to delete since we walk the
  222. // tree in depth first order and need to remove the
  223. // directories in the opposite order.
  224. deleteDirs = append(deleteDirs, path)
  225. return nil
  226. }
  227. if !scanner.PermsEqual(cur.Flags, uint32(info.Mode())) {
  228. err := os.Chmod(path, os.FileMode(cur.Flags)&os.ModePerm)
  229. if err != nil {
  230. l.Warnf("Restoring folder flags: %q: %v", path, err)
  231. } else {
  232. changed++
  233. if debug {
  234. l.Debugf("restored dir flags: %o -> %v", info.Mode()&os.ModePerm, cur)
  235. }
  236. }
  237. }
  238. if cur.Modified != info.ModTime().Unix() {
  239. t := time.Unix(cur.Modified, 0)
  240. err := os.Chtimes(path, t, t)
  241. if err != nil {
  242. l.Warnf("Restoring folder modtime: %q: %v", path, err)
  243. } else {
  244. changed++
  245. if debug {
  246. l.Debugf("restored dir modtime: %d -> %v", info.ModTime().Unix(), cur)
  247. }
  248. }
  249. }
  250. return nil
  251. }
  252. for {
  253. deleteDirs = nil
  254. changed = 0
  255. filepath.Walk(p.repoCfg.Directory, walkFn)
  256. var deleted = 0
  257. // Delete any queued directories
  258. for i := len(deleteDirs) - 1; i >= 0; i-- {
  259. dir := deleteDirs[i]
  260. if debug {
  261. l.Debugln("delete dir:", dir)
  262. }
  263. err := os.Remove(dir)
  264. if err == nil {
  265. deleted++
  266. } else if p.versioner == nil { // Failures are expected in the presence of versioning
  267. l.Warnln(err)
  268. }
  269. }
  270. if debug {
  271. l.Debugf("changed %d, deleted %d dirs", changed, deleted)
  272. }
  273. if changed+deleted == 0 {
  274. return
  275. }
  276. }
  277. }
  278. func (p *puller) handleRequestResult(res requestResult) {
  279. p.oustandingPerNode.decrease(res.node)
  280. f := res.file
  281. of, ok := p.openFiles[f.Name]
  282. if !ok || of.err != nil {
  283. // no entry in openFiles means there was an error and we've cancelled the operation
  284. return
  285. }
  286. _, of.err = of.file.WriteAt(res.data, res.offset)
  287. buffers.Put(res.data)
  288. of.outstanding--
  289. p.openFiles[f.Name] = of
  290. if debug {
  291. l.Debugf("pull: wrote %q / %q offset %d outstanding %d done %v", p.repoCfg.ID, f.Name, res.offset, of.outstanding, of.done)
  292. }
  293. if of.done && of.outstanding == 0 {
  294. p.closeFile(f)
  295. }
  296. }
  297. // handleBlock fulfills the block request by copying, ignoring or fetching
  298. // from the network. Returns true if the block was fully handled
  299. // synchronously, i.e. if the slot can be reused.
  300. func (p *puller) handleBlock(b bqBlock) bool {
  301. f := b.file
  302. // For directories, making sure they exist is enough.
  303. // Deleted directories we mark as handled and delete later.
  304. if protocol.IsDirectory(f.Flags) {
  305. if !protocol.IsDeleted(f.Flags) {
  306. path := filepath.Join(p.repoCfg.Directory, f.Name)
  307. _, err := os.Stat(path)
  308. if err != nil && os.IsNotExist(err) {
  309. if debug {
  310. l.Debugf("create dir: %v", f)
  311. }
  312. err = os.MkdirAll(path, 0777)
  313. if err != nil {
  314. l.Warnf("Create folder: %q: %v", path, err)
  315. }
  316. }
  317. } else if debug {
  318. l.Debugf("ignore delete dir: %v", f)
  319. }
  320. p.model.updateLocal(p.repoCfg.ID, f)
  321. return true
  322. }
  323. of, ok := p.openFiles[f.Name]
  324. of.done = b.last
  325. if !ok {
  326. if debug {
  327. l.Debugf("pull: %q: opening file %q", p.repoCfg.ID, f.Name)
  328. }
  329. of.availability = uint64(p.model.repoFiles[p.repoCfg.ID].Availability(f.Name))
  330. of.filepath = filepath.Join(p.repoCfg.Directory, f.Name)
  331. of.temp = filepath.Join(p.repoCfg.Directory, defTempNamer.TempName(f.Name))
  332. dirName := filepath.Dir(of.filepath)
  333. _, err := os.Stat(dirName)
  334. if err != nil {
  335. err = os.MkdirAll(dirName, 0777)
  336. }
  337. if err != nil {
  338. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  339. }
  340. of.file, of.err = os.Create(of.temp)
  341. if of.err != nil {
  342. if debug {
  343. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
  344. }
  345. if !b.last {
  346. p.openFiles[f.Name] = of
  347. }
  348. return true
  349. }
  350. osutil.HideFile(of.temp)
  351. }
  352. if of.err != nil {
  353. // We have already failed this file.
  354. if debug {
  355. l.Debugf("pull: error: %q / %q has already failed: %v", p.repoCfg.ID, f.Name, of.err)
  356. }
  357. if b.last {
  358. delete(p.openFiles, f.Name)
  359. }
  360. return true
  361. }
  362. p.openFiles[f.Name] = of
  363. switch {
  364. case len(b.copy) > 0:
  365. p.handleCopyBlock(b)
  366. return true
  367. case b.block.Size > 0:
  368. return p.handleRequestBlock(b)
  369. default:
  370. p.handleEmptyBlock(b)
  371. return true
  372. }
  373. }
  374. func (p *puller) handleCopyBlock(b bqBlock) {
  375. // We have blocks to copy from the existing file
  376. f := b.file
  377. of := p.openFiles[f.Name]
  378. if debug {
  379. l.Debugf("pull: copying %d blocks for %q / %q", len(b.copy), p.repoCfg.ID, f.Name)
  380. }
  381. var exfd *os.File
  382. exfd, of.err = os.Open(of.filepath)
  383. if of.err != nil {
  384. if debug {
  385. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
  386. }
  387. of.file.Close()
  388. of.file = nil
  389. p.openFiles[f.Name] = of
  390. return
  391. }
  392. defer exfd.Close()
  393. for _, b := range b.copy {
  394. bs := buffers.Get(int(b.Size))
  395. _, of.err = exfd.ReadAt(bs, b.Offset)
  396. if of.err == nil {
  397. _, of.err = of.file.WriteAt(bs, b.Offset)
  398. }
  399. buffers.Put(bs)
  400. if of.err != nil {
  401. if debug {
  402. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
  403. }
  404. exfd.Close()
  405. of.file.Close()
  406. of.file = nil
  407. p.openFiles[f.Name] = of
  408. return
  409. }
  410. }
  411. }
  412. // handleRequestBlock tries to pull a block from the network. Returns true if
  413. // the block could _not_ be fetched (i.e. it was fully handled, matching the
  414. // return criteria of handleBlock)
  415. func (p *puller) handleRequestBlock(b bqBlock) bool {
  416. f := b.file
  417. of, ok := p.openFiles[f.Name]
  418. if !ok {
  419. panic("bug: request for non-open file")
  420. }
  421. node := p.oustandingPerNode.leastBusyNode(of.availability, p.model.cm)
  422. if len(node) == 0 {
  423. of.err = errNoNode
  424. if of.file != nil {
  425. of.file.Close()
  426. of.file = nil
  427. os.Remove(of.temp)
  428. }
  429. if b.last {
  430. delete(p.openFiles, f.Name)
  431. } else {
  432. p.openFiles[f.Name] = of
  433. }
  434. return true
  435. }
  436. of.outstanding++
  437. p.openFiles[f.Name] = of
  438. go func(node string, b bqBlock) {
  439. if debug {
  440. l.Debugf("pull: requesting %q / %q offset %d size %d from %q outstanding %d", p.repoCfg.ID, f.Name, b.block.Offset, b.block.Size, node, of.outstanding)
  441. }
  442. bs, err := p.model.requestGlobal(node, p.repoCfg.ID, f.Name, b.block.Offset, int(b.block.Size), nil)
  443. p.requestResults <- requestResult{
  444. node: node,
  445. file: f,
  446. filepath: of.filepath,
  447. offset: b.block.Offset,
  448. data: bs,
  449. err: err,
  450. }
  451. }(node, b)
  452. return false
  453. }
  454. func (p *puller) handleEmptyBlock(b bqBlock) {
  455. f := b.file
  456. of := p.openFiles[f.Name]
  457. if b.last {
  458. if of.err == nil {
  459. of.file.Close()
  460. }
  461. }
  462. if protocol.IsDeleted(f.Flags) {
  463. if debug {
  464. l.Debugf("pull: delete %q", f.Name)
  465. }
  466. os.Remove(of.temp)
  467. os.Chmod(of.filepath, 0666)
  468. if p.versioner != nil {
  469. if err := p.versioner.Archive(of.filepath); err == nil {
  470. p.model.updateLocal(p.repoCfg.ID, f)
  471. }
  472. } else if err := os.Remove(of.filepath); err == nil || os.IsNotExist(err) {
  473. p.model.updateLocal(p.repoCfg.ID, f)
  474. }
  475. } else {
  476. if debug {
  477. l.Debugf("pull: no blocks to fetch and nothing to copy for %q / %q", p.repoCfg.ID, f.Name)
  478. }
  479. t := time.Unix(f.Modified, 0)
  480. if os.Chtimes(of.temp, t, t) != nil {
  481. delete(p.openFiles, f.Name)
  482. return
  483. }
  484. if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(f.Flags) && os.Chmod(of.temp, os.FileMode(f.Flags&0777)) != nil {
  485. delete(p.openFiles, f.Name)
  486. return
  487. }
  488. osutil.ShowFile(of.temp)
  489. if osutil.Rename(of.temp, of.filepath) == nil {
  490. p.model.updateLocal(p.repoCfg.ID, f)
  491. }
  492. }
  493. delete(p.openFiles, f.Name)
  494. }
  495. func (p *puller) queueNeededBlocks() {
  496. queued := 0
  497. for _, f := range p.model.NeedFilesRepo(p.repoCfg.ID) {
  498. lf := p.model.CurrentRepoFile(p.repoCfg.ID, f.Name)
  499. have, need := scanner.BlockDiff(lf.Blocks, f.Blocks)
  500. if debug {
  501. l.Debugf("need:\n local: %v\n global: %v\n haveBlocks: %v\n needBlocks: %v", lf, f, have, need)
  502. }
  503. queued++
  504. p.bq.put(bqAdd{
  505. file: f,
  506. have: have,
  507. need: need,
  508. })
  509. }
  510. if debug && queued > 0 {
  511. l.Debugf("%q: queued %d blocks", p.repoCfg.ID, queued)
  512. }
  513. }
  514. func (p *puller) closeFile(f scanner.File) {
  515. if debug {
  516. l.Debugf("pull: closing %q / %q", p.repoCfg.ID, f.Name)
  517. }
  518. of := p.openFiles[f.Name]
  519. of.file.Close()
  520. defer os.Remove(of.temp)
  521. delete(p.openFiles, f.Name)
  522. fd, err := os.Open(of.temp)
  523. if err != nil {
  524. if debug {
  525. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  526. }
  527. return
  528. }
  529. hb, _ := scanner.Blocks(fd, scanner.StandardBlockSize)
  530. fd.Close()
  531. if l0, l1 := len(hb), len(f.Blocks); l0 != l1 {
  532. if debug {
  533. l.Debugf("pull: %q / %q: nblocks %d != %d", p.repoCfg.ID, f.Name, l0, l1)
  534. }
  535. return
  536. }
  537. for i := range hb {
  538. if bytes.Compare(hb[i].Hash, f.Blocks[i].Hash) != 0 {
  539. l.Debugf("pull: %q / %q: block %d hash mismatch", p.repoCfg.ID, f.Name, i)
  540. return
  541. }
  542. }
  543. t := time.Unix(f.Modified, 0)
  544. err = os.Chtimes(of.temp, t, t)
  545. if debug && err != nil {
  546. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  547. }
  548. if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(f.Flags) {
  549. err = os.Chmod(of.temp, os.FileMode(f.Flags&0777))
  550. if debug && err != nil {
  551. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  552. }
  553. }
  554. osutil.ShowFile(of.temp)
  555. if p.versioner != nil {
  556. err := p.versioner.Archive(of.filepath)
  557. if err != nil {
  558. if debug {
  559. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  560. }
  561. return
  562. }
  563. }
  564. if debug {
  565. l.Debugf("pull: rename %q / %q: %q", p.repoCfg.ID, f.Name, of.filepath)
  566. }
  567. if err := osutil.Rename(of.temp, of.filepath); err == nil {
  568. p.model.updateLocal(p.repoCfg.ID, f)
  569. } else {
  570. l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
  571. }
  572. }
  573. func invalidateRepo(cfg *config.Configuration, repoID string, err error) {
  574. for i := range cfg.Repositories {
  575. repo := &cfg.Repositories[i]
  576. if repo.ID == repoID {
  577. repo.Invalid = err.Error()
  578. return
  579. }
  580. }
  581. }