mirror of
https://github.com/zrepl/zrepl.git
synced 2024-12-29 10:28:53 +01:00
264 lines
6.2 KiB
Go
264 lines
6.2 KiB
Go
package cmd
|
|
|
|
import (
|
|
"net"
|
|
"os"
|
|
"os/signal"
|
|
"syscall"
|
|
"time"
|
|
|
|
"context"
|
|
"fmt"
|
|
|
|
"github.com/mitchellh/mapstructure"
|
|
"github.com/pkg/errors"
|
|
"github.com/problame/go-streamrpc"
|
|
"github.com/zrepl/zrepl/cmd/replication.v2"
|
|
)
|
|
|
|
type PullJob struct {
|
|
Name string
|
|
Connect streamrpc.Connecter
|
|
Interval time.Duration
|
|
Mapping *DatasetMapFilter
|
|
// constructed from mapping during parsing
|
|
pruneFilter *DatasetMapFilter
|
|
SnapshotPrefix string
|
|
InitialReplPolicy InitialReplPolicy
|
|
Prune PrunePolicy
|
|
Debug JobDebugSettings
|
|
|
|
task *Task
|
|
}
|
|
|
|
func parsePullJob(c JobParsingContext, name string, i map[string]interface{}) (j *PullJob, err error) {
|
|
|
|
var asMap struct {
|
|
Connect map[string]interface{}
|
|
Interval string
|
|
Mapping map[string]string
|
|
InitialReplPolicy string `mapstructure:"initial_repl_policy"`
|
|
Prune map[string]interface{}
|
|
SnapshotPrefix string `mapstructure:"snapshot_prefix"`
|
|
Debug map[string]interface{}
|
|
}
|
|
|
|
if err = mapstructure.Decode(i, &asMap); err != nil {
|
|
err = errors.Wrap(err, "mapstructure error")
|
|
return nil, err
|
|
}
|
|
|
|
j = &PullJob{Name: name}
|
|
|
|
j.Connect, err = parseSSHStdinserverConnecter(asMap.Connect)
|
|
if err != nil {
|
|
err = errors.Wrap(err, "cannot parse 'connect'")
|
|
return nil, err
|
|
}
|
|
|
|
if j.Interval, err = parsePostitiveDuration(asMap.Interval); err != nil {
|
|
err = errors.Wrap(err, "cannot parse 'interval'")
|
|
return nil, err
|
|
}
|
|
|
|
j.Mapping, err = parseDatasetMapFilter(asMap.Mapping, false)
|
|
if err != nil {
|
|
err = errors.Wrap(err, "cannot parse 'mapping'")
|
|
return nil, err
|
|
}
|
|
|
|
if j.pruneFilter, err = j.Mapping.InvertedFilter(); err != nil {
|
|
err = errors.Wrap(err, "cannot automatically invert 'mapping' for prune job")
|
|
return nil, err
|
|
}
|
|
|
|
j.InitialReplPolicy, err = parseInitialReplPolicy(asMap.InitialReplPolicy, DEFAULT_INITIAL_REPL_POLICY)
|
|
if err != nil {
|
|
err = errors.Wrap(err, "cannot parse 'initial_repl_policy'")
|
|
return
|
|
}
|
|
|
|
if j.SnapshotPrefix, err = parseSnapshotPrefix(asMap.SnapshotPrefix); err != nil {
|
|
return
|
|
}
|
|
|
|
if j.Prune, err = parsePrunePolicy(asMap.Prune, false); err != nil {
|
|
err = errors.Wrap(err, "cannot parse prune policy")
|
|
return
|
|
}
|
|
|
|
if err = mapstructure.Decode(asMap.Debug, &j.Debug); err != nil {
|
|
err = errors.Wrap(err, "cannot parse 'debug'")
|
|
return
|
|
}
|
|
|
|
if j.Debug.Conn.ReadDump != "" || j.Debug.Conn.WriteDump != "" {
|
|
logConnecter := logNetConnConnecter{
|
|
Connecter: j.Connect,
|
|
ReadDump: j.Debug.Conn.ReadDump,
|
|
WriteDump: j.Debug.Conn.WriteDump,
|
|
}
|
|
j.Connect = logConnecter
|
|
}
|
|
|
|
return
|
|
}
|
|
|
|
func (j *PullJob) JobName() string {
|
|
return j.Name
|
|
}
|
|
|
|
func (j *PullJob) JobType() JobType { return JobTypePull }
|
|
|
|
func (j *PullJob) JobStart(ctx context.Context) {
|
|
|
|
log := ctx.Value(contextKeyLog).(Logger)
|
|
defer log.Info("exiting")
|
|
j.task = NewTask("main", j, log)
|
|
|
|
// j.task is idle here idle here
|
|
usr1 := make(chan os.Signal)
|
|
signal.Notify(usr1, syscall.SIGUSR1)
|
|
defer signal.Stop(usr1)
|
|
|
|
ticker := time.NewTicker(j.Interval)
|
|
for {
|
|
begin := time.Now()
|
|
j.doRun(ctx)
|
|
duration := time.Now().Sub(begin)
|
|
if duration > j.Interval {
|
|
j.task.Log().
|
|
WithField("actual_duration", duration).
|
|
WithField("configured_interval", j.Interval).
|
|
Warn("pull run took longer than configured interval")
|
|
}
|
|
select {
|
|
case <-ctx.Done():
|
|
j.task.Log().WithError(ctx.Err()).Info("context")
|
|
return
|
|
case <-ticker.C:
|
|
case <-usr1:
|
|
}
|
|
}
|
|
}
|
|
|
|
var STREAMRPC_CONFIG = &streamrpc.ConnConfig{ // FIXME oversight and configurability
|
|
RxHeaderMaxLen: 4096,
|
|
RxStructuredMaxLen: 4096 * 4096,
|
|
RxStreamMaxChunkSize: 4096 * 4096,
|
|
TxChunkSize: 4096 * 4096,
|
|
RxTimeout: streamrpc.Timeout{
|
|
Progress: 10 * time.Second,
|
|
},
|
|
TxTimeout: streamrpc.Timeout{
|
|
Progress: 10 * time.Second,
|
|
},
|
|
}
|
|
|
|
|
|
func (j *PullJob) doRun(ctx context.Context) {
|
|
|
|
j.task.Enter("run")
|
|
defer j.task.Finish()
|
|
|
|
// FIXME
|
|
clientConf := &streamrpc.ClientConfig{
|
|
ConnConfig: STREAMRPC_CONFIG,
|
|
}
|
|
|
|
//client, err := streamrpc.NewClient(j.Connect, clientConf)
|
|
client, err := streamrpc.NewClient(&tcpConnecter{net.Dialer{
|
|
Timeout: 10*time.Second,
|
|
}}, clientConf)
|
|
defer client.Close()
|
|
|
|
j.task.Enter("pull")
|
|
|
|
sender := RemoteEndpoint{client}
|
|
|
|
puller, err := NewReceiverEndpoint(
|
|
j.Mapping,
|
|
NewPrefixFilter(j.SnapshotPrefix),
|
|
)
|
|
if err != nil {
|
|
j.task.Log().WithError(err).Error("error creating receiver endpoint")
|
|
j.task.Finish()
|
|
return
|
|
}
|
|
|
|
usr2 := make(chan os.Signal)
|
|
defer close(usr2)
|
|
signal.Notify(usr2, syscall.SIGUSR2)
|
|
defer signal.Stop(usr2)
|
|
retryNow := make(chan struct{}, 1) // buffered so we don't leak the goroutine
|
|
go func() {
|
|
for {
|
|
sig := <-usr2
|
|
if sig != nil {
|
|
retryNow <- struct{}{}
|
|
} else {
|
|
break
|
|
}
|
|
}
|
|
}()
|
|
|
|
ctx = replication.ContextWithLogger(ctx, replicationLogAdaptor{j.task.Log().WithField("subsystem", "replication")})
|
|
ctx = streamrpc.ContextWithLogger(ctx, streamrpcLogAdaptor{j.task.Log().WithField("subsystem", "rpc.protocol")})
|
|
ctx = context.WithValue(ctx, contextKeyLog, j.task.Log().WithField("subsystem", "rpc.endpoint"))
|
|
replication.Replicate(ctx, replication.NewEndpointPairPull(sender, puller), retryNow)
|
|
|
|
client.Close()
|
|
j.task.Finish()
|
|
|
|
j.task.Enter("prune")
|
|
pruner, err := j.Pruner(j.task, PrunePolicySideDefault, false)
|
|
if err != nil {
|
|
j.task.Log().WithError(err).Error("error creating pruner")
|
|
} else {
|
|
pruner.Run(ctx)
|
|
}
|
|
j.task.Finish()
|
|
|
|
}
|
|
|
|
func (j *PullJob) JobStatus(ctxt context.Context) (*JobStatus, error) {
|
|
return &JobStatus{Tasks: []*TaskStatus{j.task.Status()}}, nil
|
|
}
|
|
|
|
func (j *PullJob) Pruner(task *Task, side PrunePolicySide, dryRun bool) (p Pruner, err error) {
|
|
p = Pruner{
|
|
task,
|
|
time.Now(),
|
|
dryRun,
|
|
j.pruneFilter,
|
|
j.SnapshotPrefix,
|
|
j.Prune,
|
|
}
|
|
return
|
|
}
|
|
|
|
func closeRPCWithTimeout(task *Task, remote RemoteEndpoint, timeout time.Duration, goodbye string) {
|
|
|
|
task.Log().Info("closing rpc connection")
|
|
|
|
ch := make(chan error)
|
|
go func() {
|
|
remote.Close()
|
|
ch <- nil
|
|
close(ch)
|
|
}()
|
|
|
|
var err error
|
|
select {
|
|
case <-time.After(timeout):
|
|
err = fmt.Errorf("timeout exceeded (%s)", timeout)
|
|
case closeRequestErr := <-ch:
|
|
err = closeRequestErr
|
|
}
|
|
|
|
if err != nil {
|
|
task.Log().WithError(err).Error("error closing connection")
|
|
}
|
|
return
|
|
}
|