syncthing/model/puller.go

702 lines
16 KiB
Go
Raw Normal View History

2014-07-13 00:45:33 +02:00
// Copyright (C) 2014 Jakob Borg and Contributors (see the CONTRIBUTORS file).
// All rights reserved. Use of this source code is governed by an MIT-style
// license that can be found in the LICENSE file.
2014-06-01 22:50:14 +02:00
2014-05-15 05:26:55 +02:00
package model
import (
"bytes"
"errors"
"os"
"path/filepath"
"runtime"
"time"
2014-05-15 02:18:09 +02:00
"github.com/calmh/syncthing/config"
2014-05-25 20:49:08 +02:00
"github.com/calmh/syncthing/osutil"
"github.com/calmh/syncthing/protocol"
"github.com/calmh/syncthing/scanner"
2014-05-25 20:49:08 +02:00
"github.com/calmh/syncthing/versioner"
)
type requestResult struct {
node protocol.NodeID
2014-07-12 23:06:48 +02:00
file protocol.FileInfo
filepath string // full filepath name
offset int64
data []byte
err error
}
type openFile struct {
filepath string // full filepath name
temp string // temporary filename
2014-07-06 14:46:48 +02:00
availability []protocol.NodeID
file *os.File
err error // error when opening or writing to file, all following operations are cancelled
outstanding int // number of requests we still have outstanding
done bool // we have sent all requests for this file
}
type activityMap map[protocol.NodeID]int
2014-07-06 14:46:48 +02:00
func (m activityMap) leastBusyNode(availability []protocol.NodeID) protocol.NodeID {
var low int = 2<<30 - 1
var selected protocol.NodeID
2014-07-06 14:46:48 +02:00
for _, node := range availability {
usage := m[node]
2014-07-06 14:46:48 +02:00
if usage < low {
low = usage
selected = node
}
}
m[selected]++
return selected
}
func (m activityMap) decrease(node protocol.NodeID) {
m[node]--
}
var errNoNode = errors.New("no available source node")
type puller struct {
2014-05-15 05:26:55 +02:00
cfg *config.Configuration
2014-05-23 14:31:16 +02:00
repoCfg config.RepositoryConfiguration
bq *blockQueue
model *Model
oustandingPerNode activityMap
openFiles map[string]openFile
requestSlots chan bool
blocks chan bqBlock
requestResults chan requestResult
2014-05-25 20:49:08 +02:00
versioner versioner.Versioner
}
2014-05-23 14:31:16 +02:00
func newPuller(repoCfg config.RepositoryConfiguration, model *Model, slots int, cfg *config.Configuration) *puller {
p := &puller{
2014-05-23 14:31:16 +02:00
repoCfg: repoCfg,
2014-05-15 05:26:55 +02:00
cfg: cfg,
bq: newBlockQueue(),
model: model,
oustandingPerNode: make(activityMap),
openFiles: make(map[string]openFile),
requestSlots: make(chan bool, slots),
blocks: make(chan bqBlock),
requestResults: make(chan requestResult),
}
2014-05-25 20:49:08 +02:00
if len(repoCfg.Versioning.Type) > 0 {
factory, ok := versioner.Factories[repoCfg.Versioning.Type]
if !ok {
l.Fatalf("Requested versioning type %q that does not exist", repoCfg.Versioning.Type)
}
p.versioner = factory(repoCfg.Versioning.Params)
}
if slots > 0 {
// Read/write
for i := 0; i < slots; i++ {
p.requestSlots <- true
}
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("starting puller; repo %q dir %q slots %d", repoCfg.ID, repoCfg.Directory, slots)
}
go p.run()
} else {
// Read only
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("starting puller; repo %q dir %q (read only)", repoCfg.ID, repoCfg.Directory)
}
go p.runRO()
}
return p
}
func (p *puller) run() {
go func() {
// fill blocks queue when there are free slots
for {
<-p.requestSlots
b := p.bq.get()
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("filler: queueing %q / %q offset %d copy %d", p.repoCfg.ID, b.file.Name, b.block.Offset, len(b.copy))
}
p.blocks <- b
}
}()
2014-05-15 05:26:55 +02:00
walkTicker := time.Tick(time.Duration(p.cfg.Options.RescanIntervalS) * time.Second)
timeout := time.Tick(5 * time.Second)
changed := true
var prevVer uint64
for {
// Run the pulling loop as long as there are blocks to fetch
pull:
for {
select {
case res := <-p.requestResults:
2014-05-23 14:31:16 +02:00
p.model.setState(p.repoCfg.ID, RepoSyncing)
changed = true
p.requestSlots <- true
p.handleRequestResult(res)
case b := <-p.blocks:
2014-05-23 14:31:16 +02:00
p.model.setState(p.repoCfg.ID, RepoSyncing)
changed = true
2014-04-27 12:06:11 +02:00
if p.handleBlock(b) {
// Block was fully handled, free up the slot
p.requestSlots <- true
}
case <-timeout:
if len(p.openFiles) == 0 && p.bq.empty() {
// Nothing more to do for the moment
break pull
}
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("%q: idle but have %d open files", p.repoCfg.ID, len(p.openFiles))
i := 5
for _, f := range p.openFiles {
2014-05-15 02:08:56 +02:00
l.Debugf(" %v", f)
i--
if i == 0 {
break
}
}
}
}
}
if changed {
2014-05-23 14:31:16 +02:00
p.model.setState(p.repoCfg.ID, RepoCleaning)
p.fixupDirectories()
changed = false
}
2014-05-23 14:31:16 +02:00
p.model.setState(p.repoCfg.ID, RepoIdle)
// Do a rescan if it's time for it
select {
case <-walkTicker:
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("%q: time for rescan", p.repoCfg.ID)
}
2014-05-23 14:31:16 +02:00
err := p.model.ScanRepo(p.repoCfg.ID)
if err != nil {
2014-05-23 14:31:16 +02:00
invalidateRepo(p.cfg, p.repoCfg.ID, err)
return
}
default:
}
if v := p.model.Version(p.repoCfg.ID); v > prevVer {
// Queue more blocks to fetch, if any
p.queueNeededBlocks()
prevVer = v
}
}
}
func (p *puller) runRO() {
2014-05-15 05:26:55 +02:00
walkTicker := time.Tick(time.Duration(p.cfg.Options.RescanIntervalS) * time.Second)
for _ = range walkTicker {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("%q: time for rescan", p.repoCfg.ID)
}
2014-05-23 14:31:16 +02:00
err := p.model.ScanRepo(p.repoCfg.ID)
if err != nil {
2014-05-23 14:31:16 +02:00
invalidateRepo(p.cfg, p.repoCfg.ID, err)
return
}
}
}
func (p *puller) fixupDirectories() {
var deleteDirs []string
var changed = 0
var walkFn = func(path string, info os.FileInfo, err error) error {
if err != nil {
return err
}
if !info.IsDir() {
return nil
}
2014-05-23 14:31:16 +02:00
rn, err := filepath.Rel(p.repoCfg.Directory, path)
if err != nil {
return nil
}
if rn == "." {
return nil
}
2014-05-25 20:49:08 +02:00
if filepath.Base(rn) == ".stversions" {
2014-07-06 14:46:48 +02:00
return filepath.SkipDir
2014-05-25 20:49:08 +02:00
}
2014-05-23 14:31:16 +02:00
cur := p.model.CurrentRepoFile(p.repoCfg.ID, rn)
if cur.Name != rn {
// No matching dir in current list; weird
if debug {
l.Debugf("missing dir: %s; %v", rn, cur)
}
return nil
}
2014-05-23 12:53:26 +02:00
if protocol.IsDeleted(cur.Flags) {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-15 02:08:56 +02:00
l.Debugf("queue delete dir: %v", cur)
}
// We queue the directories to delete since we walk the
// tree in depth first order and need to remove the
// directories in the opposite order.
deleteDirs = append(deleteDirs, path)
return nil
}
if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(cur.Flags) && !scanner.PermsEqual(cur.Flags, uint32(info.Mode())) {
err := os.Chmod(path, os.FileMode(cur.Flags)&os.ModePerm)
if err != nil {
2014-05-24 08:26:05 +02:00
l.Warnf("Restoring folder flags: %q: %v", path, err)
} else {
changed++
if debug {
l.Debugf("restored dir flags: %o -> %v", info.Mode()&os.ModePerm, cur)
}
}
}
if cur.Modified != info.ModTime().Unix() {
t := time.Unix(cur.Modified, 0)
err := os.Chtimes(path, t, t)
if err != nil {
if runtime.GOOS != "windows" {
// https://code.google.com/p/go/issues/detail?id=8090
l.Warnf("Restoring folder modtime: %q: %v", path, err)
}
} else {
changed++
if debug {
l.Debugf("restored dir modtime: %d -> %v", info.ModTime().Unix(), cur)
}
}
}
return nil
}
for {
deleteDirs = nil
changed = 0
2014-05-23 14:31:16 +02:00
filepath.Walk(p.repoCfg.Directory, walkFn)
var deleted = 0
// Delete any queued directories
for i := len(deleteDirs) - 1; i >= 0; i-- {
dir := deleteDirs[i]
if debug {
l.Debugln("delete dir:", dir)
}
err := os.Remove(dir)
2014-05-25 20:49:08 +02:00
if err == nil {
deleted++
} else {
l.Warnln("Delete dir:", err)
}
}
2014-05-15 05:26:55 +02:00
if debug {
l.Debugf("changed %d, deleted %d dirs", changed, deleted)
}
if changed+deleted == 0 {
return
}
}
}
func (p *puller) handleRequestResult(res requestResult) {
p.oustandingPerNode.decrease(res.node)
f := res.file
of, ok := p.openFiles[f.Name]
if !ok || of.err != nil {
// no entry in openFiles means there was an error and we've cancelled the operation
return
}
_, of.err = of.file.WriteAt(res.data, res.offset)
of.outstanding--
p.openFiles[f.Name] = of
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: wrote %q / %q offset %d outstanding %d done %v", p.repoCfg.ID, f.Name, res.offset, of.outstanding, of.done)
}
if of.done && of.outstanding == 0 {
2014-04-27 12:14:53 +02:00
p.closeFile(f)
}
}
2014-04-27 12:06:11 +02:00
// handleBlock fulfills the block request by copying, ignoring or fetching
// from the network. Returns true if the block was fully handled
// synchronously, i.e. if the slot can be reused.
func (p *puller) handleBlock(b bqBlock) bool {
f := b.file
// For directories, making sure they exist is enough.
// Deleted directories we mark as handled and delete later.
2014-05-23 12:53:26 +02:00
if protocol.IsDirectory(f.Flags) {
if !protocol.IsDeleted(f.Flags) {
2014-05-23 14:31:16 +02:00
path := filepath.Join(p.repoCfg.Directory, f.Name)
_, err := os.Stat(path)
if err != nil && os.IsNotExist(err) {
if debug {
l.Debugf("create dir: %v", f)
}
err = os.MkdirAll(path, 0777)
if err != nil {
l.Warnf("Create folder: %q: %v", path, err)
}
}
} else if debug {
l.Debugf("ignore delete dir: %v", f)
}
2014-05-23 14:31:16 +02:00
p.model.updateLocal(p.repoCfg.ID, f)
2014-04-27 12:06:11 +02:00
return true
}
if len(b.copy) > 0 && len(b.copy) == len(b.file.Blocks) && b.last {
// We are supposed to copy the entire file, and then fetch nothing.
// We don't actually need to make the copy.
if debug {
l.Debugln("taking shortcut:", f)
}
fp := filepath.Join(p.repoCfg.Directory, f.Name)
t := time.Unix(f.Modified, 0)
err := os.Chtimes(fp, t, t)
if debug && err != nil {
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(f.Flags) {
err = os.Chmod(fp, os.FileMode(f.Flags&0777))
if debug && err != nil {
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
}
p.model.updateLocal(p.repoCfg.ID, f)
return true
}
of, ok := p.openFiles[f.Name]
of.done = b.last
if !ok {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: %q: opening file %q", p.repoCfg.ID, f.Name)
}
2014-07-06 14:46:48 +02:00
of.availability = p.model.repoFiles[p.repoCfg.ID].Availability(f.Name)
2014-05-23 14:31:16 +02:00
of.filepath = filepath.Join(p.repoCfg.Directory, f.Name)
of.temp = filepath.Join(p.repoCfg.Directory, defTempNamer.TempName(f.Name))
dirName := filepath.Dir(of.filepath)
_, err := os.Stat(dirName)
if err != nil {
err = os.MkdirAll(dirName, 0777)
}
if err != nil {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
of.file, of.err = os.Create(of.temp)
if of.err != nil {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
}
if !b.last {
p.openFiles[f.Name] = of
}
2014-04-27 12:06:11 +02:00
return true
}
2014-05-25 20:49:08 +02:00
osutil.HideFile(of.temp)
}
if of.err != nil {
// We have already failed this file.
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q has already failed: %v", p.repoCfg.ID, f.Name, of.err)
}
if b.last {
delete(p.openFiles, f.Name)
}
2014-04-27 12:06:11 +02:00
return true
}
p.openFiles[f.Name] = of
switch {
case len(b.copy) > 0:
p.handleCopyBlock(b)
2014-04-27 12:06:11 +02:00
return true
case b.block.Size > 0:
2014-04-27 12:06:11 +02:00
return p.handleRequestBlock(b)
default:
p.handleEmptyBlock(b)
2014-04-27 12:06:11 +02:00
return true
}
}
func (p *puller) handleCopyBlock(b bqBlock) {
// We have blocks to copy from the existing file
f := b.file
of := p.openFiles[f.Name]
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: copying %d blocks for %q / %q", len(b.copy), p.repoCfg.ID, f.Name)
}
var exfd *os.File
exfd, of.err = os.Open(of.filepath)
if of.err != nil {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
}
of.file.Close()
of.file = nil
p.openFiles[f.Name] = of
return
}
defer exfd.Close()
for _, b := range b.copy {
2014-06-18 23:57:22 +02:00
bs := make([]byte, b.Size)
_, of.err = exfd.ReadAt(bs, b.Offset)
if of.err == nil {
_, of.err = of.file.WriteAt(bs, b.Offset)
}
if of.err != nil {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, of.err)
}
exfd.Close()
of.file.Close()
of.file = nil
p.openFiles[f.Name] = of
return
}
}
}
2014-04-27 12:06:11 +02:00
// handleRequestBlock tries to pull a block from the network. Returns true if
// the block could _not_ be fetched (i.e. it was fully handled, matching the
// return criteria of handleBlock)
func (p *puller) handleRequestBlock(b bqBlock) bool {
f := b.file
2014-04-27 12:14:53 +02:00
of, ok := p.openFiles[f.Name]
if !ok {
panic("bug: request for non-open file")
}
2014-07-06 14:46:48 +02:00
node := p.oustandingPerNode.leastBusyNode(of.availability)
if len(node) == 0 {
of.err = errNoNode
if of.file != nil {
of.file.Close()
of.file = nil
os.Remove(of.temp)
}
if b.last {
delete(p.openFiles, f.Name)
} else {
p.openFiles[f.Name] = of
}
2014-04-27 12:06:11 +02:00
return true
}
of.outstanding++
p.openFiles[f.Name] = of
go func(node protocol.NodeID, b bqBlock) {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: requesting %q / %q offset %d size %d from %q outstanding %d", p.repoCfg.ID, f.Name, b.block.Offset, b.block.Size, node, of.outstanding)
}
2014-05-23 14:31:16 +02:00
bs, err := p.model.requestGlobal(node, p.repoCfg.ID, f.Name, b.block.Offset, int(b.block.Size), nil)
p.requestResults <- requestResult{
node: node,
file: f,
filepath: of.filepath,
offset: b.block.Offset,
data: bs,
err: err,
}
}(node, b)
2014-04-27 12:06:11 +02:00
return false
}
func (p *puller) handleEmptyBlock(b bqBlock) {
f := b.file
of := p.openFiles[f.Name]
if b.last {
if of.err == nil {
of.file.Close()
}
}
2014-05-23 12:53:26 +02:00
if protocol.IsDeleted(f.Flags) {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-15 02:08:56 +02:00
l.Debugf("pull: delete %q", f.Name)
}
os.Remove(of.temp)
os.Chmod(of.filepath, 0666)
2014-05-25 20:49:08 +02:00
if p.versioner != nil {
if debug {
l.Debugln("pull: deleting with versioner")
}
if err := p.versioner.Archive(p.repoCfg.Directory, of.filepath); err == nil {
2014-05-25 20:49:08 +02:00
p.model.updateLocal(p.repoCfg.ID, f)
} else if debug {
l.Debugln("pull: error:", err)
2014-05-25 20:49:08 +02:00
}
} else if err := os.Remove(of.filepath); err == nil || os.IsNotExist(err) {
2014-05-23 14:31:16 +02:00
p.model.updateLocal(p.repoCfg.ID, f)
}
} else {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: no blocks to fetch and nothing to copy for %q / %q", p.repoCfg.ID, f.Name)
}
t := time.Unix(f.Modified, 0)
if os.Chtimes(of.temp, t, t) != nil {
delete(p.openFiles, f.Name)
return
}
2014-05-23 14:31:16 +02:00
if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(f.Flags) && os.Chmod(of.temp, os.FileMode(f.Flags&0777)) != nil {
delete(p.openFiles, f.Name)
return
}
2014-05-25 20:49:08 +02:00
osutil.ShowFile(of.temp)
if osutil.Rename(of.temp, of.filepath) == nil {
2014-05-23 14:31:16 +02:00
p.model.updateLocal(p.repoCfg.ID, f)
}
}
delete(p.openFiles, f.Name)
}
func (p *puller) queueNeededBlocks() {
queued := 0
2014-05-23 14:31:16 +02:00
for _, f := range p.model.NeedFilesRepo(p.repoCfg.ID) {
lf := p.model.CurrentRepoFile(p.repoCfg.ID, f.Name)
have, need := scanner.BlockDiff(lf.Blocks, f.Blocks)
2014-05-15 05:26:55 +02:00
if debug {
2014-05-15 02:08:56 +02:00
l.Debugf("need:\n local: %v\n global: %v\n haveBlocks: %v\n needBlocks: %v", lf, f, have, need)
}
queued++
p.bq.put(bqAdd{
file: f,
have: have,
need: need,
})
}
2014-05-15 05:26:55 +02:00
if debug && queued > 0 {
2014-05-23 14:31:16 +02:00
l.Debugf("%q: queued %d blocks", p.repoCfg.ID, queued)
}
}
2014-04-27 12:14:53 +02:00
2014-07-12 23:06:48 +02:00
func (p *puller) closeFile(f protocol.FileInfo) {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: closing %q / %q", p.repoCfg.ID, f.Name)
2014-04-27 12:14:53 +02:00
}
of := p.openFiles[f.Name]
of.file.Close()
defer os.Remove(of.temp)
delete(p.openFiles, f.Name)
fd, err := os.Open(of.temp)
if err != nil {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
2014-04-27 12:14:53 +02:00
}
return
}
2014-05-15 05:26:55 +02:00
hb, _ := scanner.Blocks(fd, scanner.StandardBlockSize)
2014-04-27 12:14:53 +02:00
fd.Close()
if l0, l1 := len(hb), len(f.Blocks); l0 != l1 {
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: %q / %q: nblocks %d != %d", p.repoCfg.ID, f.Name, l0, l1)
2014-04-27 12:14:53 +02:00
}
return
}
for i := range hb {
if bytes.Compare(hb[i].Hash, f.Blocks[i].Hash) != 0 {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: %q / %q: block %d hash mismatch", p.repoCfg.ID, f.Name, i)
2014-04-27 12:14:53 +02:00
return
}
}
t := time.Unix(f.Modified, 0)
2014-05-23 14:31:16 +02:00
err = os.Chtimes(of.temp, t, t)
if debug && err != nil {
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
if !p.repoCfg.IgnorePerms && protocol.HasPermissionBits(f.Flags) {
err = os.Chmod(of.temp, os.FileMode(f.Flags&0777))
if debug && err != nil {
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
}
2014-05-25 20:49:08 +02:00
osutil.ShowFile(of.temp)
if p.versioner != nil {
err := p.versioner.Archive(p.repoCfg.Directory, of.filepath)
2014-05-25 20:49:08 +02:00
if err != nil {
if debug {
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
}
return
}
}
2014-05-15 05:26:55 +02:00
if debug {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: rename %q / %q: %q", p.repoCfg.ID, f.Name, of.filepath)
2014-04-27 12:14:53 +02:00
}
2014-05-25 20:49:08 +02:00
if err := osutil.Rename(of.temp, of.filepath); err == nil {
2014-05-23 14:31:16 +02:00
p.model.updateLocal(p.repoCfg.ID, f)
2014-04-27 12:14:53 +02:00
} else {
2014-05-23 14:31:16 +02:00
l.Debugf("pull: error: %q / %q: %v", p.repoCfg.ID, f.Name, err)
2014-04-27 12:14:53 +02:00
}
}
2014-05-15 02:18:09 +02:00
2014-05-15 05:26:55 +02:00
func invalidateRepo(cfg *config.Configuration, repoID string, err error) {
2014-05-15 02:18:09 +02:00
for i := range cfg.Repositories {
repo := &cfg.Repositories[i]
if repo.ID == repoID {
repo.Invalid = err.Error()
return
}
}
}