zrepl/cmd/main.go

385 lines
8.7 KiB
Go
Raw Normal View History

2017-04-14 19:26:32 +02:00
package main
2017-04-26 20:21:18 +02:00
import (
"fmt"
2017-04-26 20:25:53 +02:00
"github.com/urfave/cli"
"github.com/zrepl/zrepl/jobrun"
2017-05-07 12:28:31 +02:00
"github.com/zrepl/zrepl/rpc"
"github.com/zrepl/zrepl/sshbytestream"
"github.com/zrepl/zrepl/zfs"
"io"
"log"
"os"
2017-05-07 12:28:31 +02:00
"runtime/debug"
"sync"
"time"
2017-04-26 20:21:18 +02:00
)
// Logger is the minimal logging capability used throughout this command:
// anything that offers a fmt-style Printf method qualifies.
type Logger interface {
	// Printf formats args according to layout and emits the result.
	Printf(layout string, args ...interface{})
}
2017-04-26 20:21:18 +02:00
var conf Config
var runner *jobrun.JobRunner
2017-05-03 18:13:50 +02:00
var logFlags int = log.LUTC | log.Ldate | log.Ltime
var defaultLog Logger
2017-04-14 19:26:32 +02:00
2017-04-26 20:21:18 +02:00
func main() {
2017-04-14 19:26:32 +02:00
2017-05-07 12:28:31 +02:00
defer func() {
2017-05-07 20:42:39 +02:00
e := recover()
defaultLog.Printf("panic:\n%s\n\n", debug.Stack())
defaultLog.Printf("error: %t %s", e, e)
2017-05-07 12:28:31 +02:00
os.Exit(1)
}()
2017-04-26 20:21:18 +02:00
app := cli.NewApp()
2017-04-14 19:26:32 +02:00
2017-04-26 20:21:18 +02:00
app.Name = "zrepl"
app.Usage = "replicate zfs datasets"
app.EnableBashCompletion = true
app.Flags = []cli.Flag{
cli.StringFlag{Name: "config"},
2017-04-14 19:26:32 +02:00
}
2017-04-26 20:25:53 +02:00
app.Before = func(c *cli.Context) (err error) {
defaultLog = log.New(os.Stderr, "", logFlags)
2017-04-26 20:21:18 +02:00
if !c.GlobalIsSet("config") {
2017-05-07 12:28:31 +02:00
return cli.NewExitError("config flag not set", 2)
2017-04-26 20:21:18 +02:00
}
if conf, err = ParseConfig(c.GlobalString("config")); err != nil {
2017-05-07 12:28:31 +02:00
return cli.NewExitError(err, 2)
2017-04-26 20:21:18 +02:00
}
2017-05-03 18:13:50 +02:00
jobrunLogger := log.New(os.Stderr, "jobrun ", logFlags)
runner = jobrun.NewJobRunner(jobrunLogger)
2017-04-26 20:21:18 +02:00
return
}
app.Commands = []cli.Command{
2017-04-26 20:25:53 +02:00
{
Name: "sink",
Aliases: []string{"s"},
Usage: "start in sink mode",
Flags: []cli.Flag{
cli.StringFlag{Name: "identity"},
2017-05-07 12:28:31 +02:00
cli.StringFlag{Name: "logfile"},
2017-04-26 20:25:53 +02:00
},
Action: doSink,
2017-04-26 20:21:18 +02:00
},
2017-04-26 20:25:53 +02:00
{
Name: "run",
Aliases: []string{"r"},
Usage: "do replication",
Action: doRun,
},
}
2017-04-14 19:26:32 +02:00
2017-05-07 12:28:31 +02:00
app.Run(os.Args)
2017-04-14 19:26:32 +02:00
2017-04-26 20:21:18 +02:00
}
2017-04-14 19:26:32 +02:00
2017-04-26 20:21:18 +02:00
func doSink(c *cli.Context) (err error) {
2017-05-07 12:28:31 +02:00
if !c.IsSet("identity") {
return cli.NewExitError("identity flag not set", 2)
}
identity := c.String("identity")
var logOut io.Writer
if c.IsSet("logfile") {
logOut, err = os.OpenFile(c.String("logfile"), os.O_CREATE|os.O_TRUNC|os.O_WRONLY, 0600)
if err != nil {
return
}
} else {
logOut = os.Stderr
}
var sshByteStream io.ReadWriteCloser
if sshByteStream, err = sshbytestream.Incoming(); err != nil {
return
}
findMapping := func(cm []ClientMapping) zfs.DatasetMapping {
for i := range cm {
if cm[i].From == identity {
return cm[i].Mapping
}
}
return nil
}
sinkLogger := log.New(logOut, fmt.Sprintf("sink[%s] ", identity), logFlags)
handler := Handler{
Logger: sinkLogger,
PushMapping: findMapping(conf.Sinks),
PullMapping: findMapping(conf.PullACLs),
}
2017-05-12 20:26:48 +02:00
if err = rpc.ListenByteStreamRPC(sshByteStream, handler, sinkLogger); err != nil {
2017-05-07 12:28:31 +02:00
//os.Exit(1)
err = cli.NewExitError(err, 1)
defaultLog.Printf("listenbytestreamerror: %#v\n", err)
}
return
2017-05-07 12:28:31 +02:00
2017-04-14 19:26:32 +02:00
}
2017-04-26 20:21:18 +02:00
func doRun(c *cli.Context) error {
2017-04-14 19:26:32 +02:00
// Do every pull, do every push
// Scheduling
var wg sync.WaitGroup
wg.Add(1)
go func() {
defer wg.Done()
runner.Start()
}()
for i := range conf.Pulls {
pull := conf.Pulls[i]
j := jobrun.Job{
Name: fmt.Sprintf("pull%d", i),
Interval: time.Duration(5 * time.Second),
Repeats: true,
2017-05-03 18:13:50 +02:00
RunFunc: func(log jobrun.Logger) error {
2017-05-07 12:28:31 +02:00
log.Printf("doing pull: %v", pull)
return doPull(pull, c, log)
},
}
runner.AddJob(j)
}
for i := range conf.Pushs {
push := conf.Pushs[i]
j := jobrun.Job{
Name: fmt.Sprintf("push%d", i),
Interval: time.Duration(5 * time.Second),
Repeats: true,
2017-05-03 18:13:50 +02:00
RunFunc: func(log jobrun.Logger) error {
log.Printf("%v: %#v\n", time.Now(), push)
return nil
},
}
runner.AddJob(j)
}
2017-05-07 12:28:31 +02:00
for {
select {
case job := <-runner.NotificationChan():
log.Printf("notificaiton on job %s: error=%v\n", job.Name, job.LastError)
}
}
wg.Wait()
2017-04-14 19:26:32 +02:00
2017-04-26 20:21:18 +02:00
return nil
2017-04-14 19:26:32 +02:00
}
2017-05-07 12:28:31 +02:00
func doPull(pull Pull, c *cli.Context, log jobrun.Logger) (err error) {
2017-05-07 12:28:31 +02:00
if lt, ok := pull.From.Transport.(LocalTransport); ok {
lt.SetHandler(Handler{
Logger: log,
PullMapping: pull.Mapping,
})
pull.From.Transport = lt
log.Printf("fixing up local transport: %#v", pull.From.Transport)
}
var remote rpc.RPCRequester
if remote, err = pull.From.Transport.Connect(); err != nil {
return
}
fsr := rpc.FilesystemRequest{
Direction: rpc.DirectionPull,
}
var remoteFilesystems []zfs.DatasetPath
if remoteFilesystems, err = remote.FilesystemRequest(fsr); err != nil {
return
}
type RemoteLocalMapping struct {
Remote zfs.DatasetPath
Local zfs.DatasetPath
LocalExists bool
}
2017-05-07 20:42:39 +02:00
replMapping := make(map[string]RemoteLocalMapping, len(remoteFilesystems))
localTraversal := zfs.NewDatasetPathForest()
localExists, err := zfs.ZFSListFilesystemExists()
if err != nil {
log.Printf("cannot get local filesystems map: %s", err)
return err
}
2017-05-07 12:28:31 +02:00
{
log.Printf("mapping using %#v\n", pull.Mapping)
for fs := range remoteFilesystems {
var err error
var localFs zfs.DatasetPath
localFs, err = pull.Mapping.Map(remoteFilesystems[fs])
if err != nil {
if err != zfs.NoMatchError {
log.Printf("error mapping %s: %#v\n", remoteFilesystems[fs], err)
return err
}
continue
}
m := RemoteLocalMapping{remoteFilesystems[fs], localFs, localExists(localFs)}
2017-05-07 20:42:39 +02:00
replMapping[m.Local.ToString()] = m
localTraversal.Add(m.Local)
2017-05-07 12:28:31 +02:00
}
}
log.Printf("remoteFilesystems: %#v\nreplMapping: %#v\n", remoteFilesystems, replMapping)
// per fs sync, assume sorted in top-down order TODO
2017-05-07 20:42:39 +02:00
localTraversal.WalkTopDown(func(v zfs.DatasetPathVisit) bool {
if v.FilledIn {
if localExists(v.Path) {
return true
}
log.Printf("creating fill-in dataset %s", v.Path)
return false
}
m, ok := replMapping[v.Path.ToString()]
if !ok {
panic("internal inconsistency: replMapping should contain mapping for any path that was not filled in by WalkTopDown()")
}
2017-05-07 12:28:31 +02:00
log := func(format string, args ...interface{}) {
log.Printf("[%s => %s]: %s", m.Remote.ToString(), m.Local.ToString(), fmt.Sprintf(format, args...))
}
log("mapping: %#v\n", m)
var versions []zfs.FilesystemVersion
if m.LocalExists {
if versions, err = zfs.ZFSListFilesystemVersions(m.Local); err != nil {
log("cannot get filesystem versions, stopping...: %v\n", m.Local.ToString(), m, err)
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
}
var theirVersions []zfs.FilesystemVersion
theirVersions, err = remote.FilesystemVersionsRequest(rpc.FilesystemVersionsRequest{
Filesystem: m.Remote,
})
if err != nil {
log("cannot fetch remote filesystem versions, stopping: %s", err)
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
diff := zfs.MakeFilesystemDiff(versions, theirVersions)
log("diff: %#v\n", diff)
if diff.IncrementalPath == nil {
log("performing initial sync, following policy: %#v", pull.InitialReplPolicy)
if pull.InitialReplPolicy != InitialReplPolicyMostRecent {
panic(fmt.Sprintf("policy %#v not implemented", pull.InitialReplPolicy))
}
snapsOnly := make([]zfs.FilesystemVersion, 0, len(diff.MRCAPathRight))
for s := range diff.MRCAPathRight {
if diff.MRCAPathRight[s].Type == zfs.Snapshot {
snapsOnly = append(snapsOnly, diff.MRCAPathRight[s])
}
}
if len(snapsOnly) < 1 {
log("cannot perform initial sync: no remote snapshots. stopping...")
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
r := rpc.InitialTransferRequest{
Filesystem: m.Remote,
FilesystemVersion: snapsOnly[len(snapsOnly)-1],
}
log("requesting initial transfer")
var stream io.Reader
if stream, err = remote.InitialTransferRequest(r); err != nil {
log("error initial transfer request, stopping...: %s", err)
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
log("received initial transfer request response. zfs recv...")
if err = zfs.ZFSRecv(m.Local, stream, "-u"); err != nil {
log("error receiving stream, stopping...: %s", err)
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
log("configuring properties of received filesystem")
if err = zfs.ZFSSet(m.Local, "readonly", "on"); err != nil {
}
log("finished initial transfer")
} else if len(diff.IncrementalPath) < 2 {
log("remote and local are in sync")
} else {
log("incremental transfers using path: %#v", diff.IncrementalPath)
for i := 0; i < len(diff.IncrementalPath)-1; i++ {
from, to := diff.IncrementalPath[i], diff.IncrementalPath[i+1]
log := func(format string, args ...interface{}) {
log("[%s => %s]: %s", from.Name, to.Name, fmt.Sprintf(format, args...))
}
r := rpc.IncrementalTransferRequest{
Filesystem: m.Remote,
From: from,
To: to,
}
log("requesting incremental transfer: %#v", r)
var stream io.Reader
if stream, err = remote.IncrementalTransferRequest(r); err != nil {
log("error requesting incremental transfer, stopping...: %s", err.Error())
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
log("receving incremental transfer")
if err = zfs.ZFSRecv(m.Local, stream); err != nil {
log("error receiving stream, stopping...: %s", err)
2017-05-07 20:42:39 +02:00
return false
2017-05-07 12:28:31 +02:00
}
log("finished incremental transfer")
}
log("finished incremental transfer path")
}
2017-05-07 20:42:39 +02:00
return true
})
2017-05-07 12:28:31 +02:00
return nil
}