mirror of
https://github.com/zrepl/zrepl.git
synced 2025-01-11 08:49:28 +01:00
524 lines
11 KiB
Go
524 lines
11 KiB
Go
package pruner
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"github.com/pkg/errors"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/zrepl/zrepl/config"
|
|
"github.com/zrepl/zrepl/logger"
|
|
"github.com/zrepl/zrepl/pruning"
|
|
"github.com/zrepl/zrepl/replication/pdu"
|
|
"net"
|
|
"sort"
|
|
"sync"
|
|
"time"
|
|
)
|
|
|
|
// Try to keep it compatible with gitub.com/zrepl/zrepl/replication.Endpoint
|
|
type History interface {
|
|
ReplicationCursor(ctx context.Context, req *pdu.ReplicationCursorReq) (*pdu.ReplicationCursorRes, error)
|
|
}
|
|
|
|
type Target interface {
|
|
ListFilesystems(ctx context.Context) ([]*pdu.Filesystem, error)
|
|
ListFilesystemVersions(ctx context.Context, fs string) ([]*pdu.FilesystemVersion, error) // fix depS
|
|
DestroySnapshots(ctx context.Context, req *pdu.DestroySnapshotsReq) (*pdu.DestroySnapshotsRes, error)
|
|
}
|
|
|
|
type Logger = logger.Logger
|
|
|
|
type contextKey int
|
|
|
|
const contextKeyLogger contextKey = 0
|
|
|
|
func WithLogger(ctx context.Context, log Logger) context.Context {
|
|
return context.WithValue(ctx, contextKeyLogger, log)
|
|
}
|
|
|
|
func GetLogger(ctx context.Context) Logger {
|
|
if l, ok := ctx.Value(contextKeyLogger).(Logger); ok {
|
|
return l
|
|
}
|
|
return logger.NewNullLogger()
|
|
}
|
|
|
|
type args struct {
|
|
ctx context.Context
|
|
target Target
|
|
receiver History
|
|
rules []pruning.KeepRule
|
|
retryWait time.Duration
|
|
considerSnapAtCursorReplicated bool
|
|
promPruneSecs prometheus.Observer
|
|
}
|
|
|
|
type Pruner struct {
|
|
args args
|
|
|
|
mtx sync.RWMutex
|
|
|
|
state State
|
|
|
|
// State ErrWait|ErrPerm
|
|
sleepUntil time.Time
|
|
err error
|
|
|
|
// State Exec
|
|
prunePending []*fs
|
|
pruneCompleted []*fs
|
|
}
|
|
|
|
type PrunerFactory struct {
|
|
senderRules []pruning.KeepRule
|
|
receiverRules []pruning.KeepRule
|
|
retryWait time.Duration
|
|
considerSnapAtCursorReplicated bool
|
|
promPruneSecs *prometheus.HistogramVec
|
|
}
|
|
|
|
func checkContainsKeep1(rules []pruning.KeepRule) error {
|
|
if len(rules) == 0 {
|
|
return nil //No keep rules means keep all - ok
|
|
}
|
|
for _, e := range rules {
|
|
switch e.(type) {
|
|
case *pruning.KeepLastN:
|
|
return nil
|
|
}
|
|
}
|
|
return errors.New("sender keep rules must contain last_n or be empty so that the last snapshot is definitely kept")
|
|
}
|
|
|
|
func NewPrunerFactory(in config.PruningSenderReceiver, promPruneSecs *prometheus.HistogramVec) (*PrunerFactory, error) {
|
|
keepRulesReceiver, err := pruning.RulesFromConfig(in.KeepReceiver)
|
|
if err != nil {
|
|
return nil, errors.Wrap(err, "cannot build receiver pruning rules")
|
|
}
|
|
|
|
keepRulesSender, err := pruning.RulesFromConfig(in.KeepSender)
|
|
if err != nil {
|
|
return nil, errors.Wrap(err, "cannot build sender pruning rules")
|
|
}
|
|
|
|
considerSnapAtCursorReplicated := false
|
|
for _, r := range in.KeepSender {
|
|
knr, ok := r.Ret.(*config.PruneKeepNotReplicated)
|
|
if !ok {
|
|
continue
|
|
}
|
|
considerSnapAtCursorReplicated = considerSnapAtCursorReplicated || !knr.KeepSnapshotAtCursor
|
|
}
|
|
f := &PrunerFactory{
|
|
keepRulesSender,
|
|
keepRulesReceiver,
|
|
10 * time.Second, //FIXME constant
|
|
considerSnapAtCursorReplicated,
|
|
promPruneSecs,
|
|
}
|
|
return f, nil
|
|
}
|
|
|
|
func (f *PrunerFactory) BuildSenderPruner(ctx context.Context, target Target, receiver History) *Pruner {
|
|
p := &Pruner{
|
|
args: args{
|
|
WithLogger(ctx, GetLogger(ctx).WithField("prune_side", "sender")),
|
|
target,
|
|
receiver,
|
|
f.senderRules,
|
|
f.retryWait,
|
|
f.considerSnapAtCursorReplicated,
|
|
f.promPruneSecs.WithLabelValues("sender"),
|
|
},
|
|
state: Plan,
|
|
}
|
|
return p
|
|
}
|
|
|
|
func (f *PrunerFactory) BuildReceiverPruner(ctx context.Context, target Target, receiver History) *Pruner {
|
|
p := &Pruner{
|
|
args: args{
|
|
WithLogger(ctx, GetLogger(ctx).WithField("prune_side", "receiver")),
|
|
target,
|
|
receiver,
|
|
f.receiverRules,
|
|
f.retryWait,
|
|
false, // senseless here anyways
|
|
f.promPruneSecs.WithLabelValues("receiver"),
|
|
},
|
|
state: Plan,
|
|
}
|
|
return p
|
|
}
|
|
|
|
//go:generate enumer -type=State
|
|
type State int
|
|
|
|
const (
|
|
Plan State = 1 << iota
|
|
PlanWait
|
|
Exec
|
|
ExecWait
|
|
ErrPerm
|
|
Done
|
|
)
|
|
|
|
func (s State) statefunc() state {
|
|
var statemap = map[State]state{
|
|
Plan: statePlan,
|
|
PlanWait: statePlanWait,
|
|
Exec: stateExec,
|
|
ExecWait: stateExecWait,
|
|
ErrPerm: nil,
|
|
Done: nil,
|
|
}
|
|
return statemap[s]
|
|
}
|
|
|
|
type updater func(func(*Pruner)) State
|
|
type state func(args *args, u updater) state
|
|
|
|
func (p *Pruner) Prune() {
|
|
p.prune(p.args)
|
|
}
|
|
|
|
func (p *Pruner) prune(args args) {
|
|
s := p.state.statefunc()
|
|
for s != nil {
|
|
pre := p.state
|
|
s = s(&args, func(f func(*Pruner)) State {
|
|
p.mtx.Lock()
|
|
defer p.mtx.Unlock()
|
|
f(p)
|
|
return p.state
|
|
})
|
|
post := p.state
|
|
GetLogger(args.ctx).
|
|
WithField("transition", fmt.Sprintf("%s=>%s", pre, post)).
|
|
Debug("state transition")
|
|
}
|
|
}
|
|
|
|
type Report struct {
|
|
State string
|
|
SleepUntil time.Time
|
|
Error string
|
|
Pending, Completed []FSReport
|
|
}
|
|
|
|
type FSReport struct {
|
|
Filesystem string
|
|
SnapshotList, DestroyList []SnapshotReport
|
|
Error string
|
|
}
|
|
|
|
type SnapshotReport struct {
|
|
Name string
|
|
Replicated bool
|
|
Date time.Time
|
|
}
|
|
|
|
func (p *Pruner) Report() *Report {
|
|
p.mtx.Lock()
|
|
defer p.mtx.Unlock()
|
|
|
|
r := Report{State: p.state.String()}
|
|
|
|
if p.state & PlanWait|ExecWait != 0 {
|
|
r.SleepUntil = p.sleepUntil
|
|
}
|
|
if p.state & PlanWait|ExecWait|ErrPerm != 0 {
|
|
if p.err != nil {
|
|
r.Error = p.err.Error()
|
|
}
|
|
}
|
|
|
|
if p.state & Plan|PlanWait == 0 {
|
|
return &r
|
|
}
|
|
|
|
r.Pending = make([]FSReport, len(p.prunePending))
|
|
for i, fs := range p.prunePending{
|
|
r.Pending[i] = fs.Report()
|
|
}
|
|
r.Completed = make([]FSReport, len(p.pruneCompleted))
|
|
for i, fs := range p.pruneCompleted{
|
|
r.Completed[i] = fs.Report()
|
|
}
|
|
|
|
return &r
|
|
}
|
|
|
|
type fs struct {
|
|
path string
|
|
|
|
// snapshots presented by target
|
|
// (type snapshot)
|
|
snaps []pruning.Snapshot
|
|
// destroy list returned by pruning.PruneSnapshots(snaps)
|
|
// (type snapshot)
|
|
destroyList []pruning.Snapshot
|
|
|
|
mtx sync.RWMutex
|
|
// for Plan
|
|
err error
|
|
}
|
|
|
|
func (f *fs) Update(err error) {
|
|
f.mtx.Lock()
|
|
defer f.mtx.Unlock()
|
|
f.err = err
|
|
}
|
|
|
|
func (f *fs) Report() FSReport {
|
|
f.mtx.Lock()
|
|
defer f.mtx.Unlock()
|
|
|
|
r := FSReport{}
|
|
r.Filesystem = f.path
|
|
if f.err != nil {
|
|
r.Error = f.err.Error()
|
|
}
|
|
|
|
r.SnapshotList = make([]SnapshotReport, len(f.snaps))
|
|
for i, snap := range f.snaps {
|
|
r.SnapshotList[i] = snap.(snapshot).Report()
|
|
}
|
|
|
|
r.DestroyList = make([]SnapshotReport, len(f.destroyList))
|
|
for i, snap := range f.destroyList{
|
|
r.DestroyList[i] = snap.(snapshot).Report()
|
|
}
|
|
|
|
return r
|
|
}
|
|
|
|
type snapshot struct {
|
|
replicated bool
|
|
date time.Time
|
|
fsv *pdu.FilesystemVersion
|
|
}
|
|
|
|
func (s snapshot) Report() SnapshotReport {
|
|
return SnapshotReport{
|
|
Name: s.Name(),
|
|
Replicated: s.Replicated(),
|
|
Date: s.Date(),
|
|
}
|
|
}
|
|
|
|
var _ pruning.Snapshot = snapshot{}
|
|
|
|
func (s snapshot) Name() string { return s.fsv.Name }
|
|
|
|
func (s snapshot) Replicated() bool { return s.replicated }
|
|
|
|
func (s snapshot) Date() time.Time { return s.date }
|
|
|
|
func shouldRetry(e error) bool {
|
|
switch e.(type) {
|
|
case nil:
|
|
return true
|
|
case net.Error:
|
|
return true
|
|
}
|
|
return false
|
|
}
|
|
|
|
func onErr(u updater, e error) state {
|
|
return u(func(p *Pruner) {
|
|
p.err = e
|
|
if !shouldRetry(e) {
|
|
p.state = ErrPerm
|
|
return
|
|
}
|
|
switch p.state {
|
|
case Plan:
|
|
p.state = PlanWait
|
|
case Exec:
|
|
p.state = ExecWait
|
|
default:
|
|
panic(p.state)
|
|
}
|
|
}).statefunc()
|
|
}
|
|
|
|
func statePlan(a *args, u updater) state {
|
|
|
|
ctx, target, receiver := a.ctx, a.target, a.receiver
|
|
|
|
tfss, err := target.ListFilesystems(ctx)
|
|
if err != nil {
|
|
return onErr(u, err)
|
|
}
|
|
|
|
pfss := make([]*fs, len(tfss))
|
|
fsloop:
|
|
for i, tfs := range tfss {
|
|
|
|
l := GetLogger(ctx).WithField("fs", tfs.Path)
|
|
l.Debug("plan filesystem")
|
|
|
|
|
|
pfs := &fs{
|
|
path: tfs.Path,
|
|
}
|
|
pfss[i] = pfs
|
|
|
|
tfsvs, err := target.ListFilesystemVersions(ctx, tfs.Path)
|
|
if err != nil {
|
|
l.WithError(err).Error("cannot list filesystem versions")
|
|
if shouldRetry(err) {
|
|
return onErr(u, err)
|
|
}
|
|
pfs.err = err
|
|
continue fsloop
|
|
}
|
|
pfs.snaps = make([]pruning.Snapshot, 0, len(tfsvs))
|
|
|
|
rcReq := &pdu.ReplicationCursorReq{
|
|
Filesystem: tfs.Path,
|
|
Op: &pdu.ReplicationCursorReq_Get{
|
|
Get: &pdu.ReplicationCursorReq_GetOp{},
|
|
},
|
|
}
|
|
rc, err := receiver.ReplicationCursor(ctx, rcReq)
|
|
if err != nil {
|
|
l.WithError(err).Error("cannot get replication cursor")
|
|
if shouldRetry(err) {
|
|
return onErr(u, err)
|
|
}
|
|
pfs.err = err
|
|
continue fsloop
|
|
}
|
|
if rc.GetError() != "" {
|
|
l.WithField("reqErr", rc.GetError()).Error("cannot get replication cursor")
|
|
pfs.err = fmt.Errorf("%s", rc.GetError())
|
|
continue fsloop
|
|
}
|
|
|
|
|
|
// scan from older to newer, all snapshots older than cursor are interpreted as replicated
|
|
sort.Slice(tfsvs, func(i, j int) bool {
|
|
return tfsvs[i].CreateTXG < tfsvs[j].CreateTXG
|
|
})
|
|
|
|
haveCursorSnapshot := false
|
|
for _, tfsv := range tfsvs {
|
|
if tfsv.Type != pdu.FilesystemVersion_Snapshot {
|
|
continue
|
|
}
|
|
if tfsv.Guid == rc.GetGuid() {
|
|
haveCursorSnapshot = true
|
|
}
|
|
}
|
|
preCursor := haveCursorSnapshot
|
|
for _, tfsv := range tfsvs {
|
|
if tfsv.Type != pdu.FilesystemVersion_Snapshot {
|
|
continue
|
|
}
|
|
creation, err := tfsv.CreationAsTime()
|
|
if err != nil {
|
|
pfs.err = fmt.Errorf("%s%s has invalid creation date: %s", tfs, tfsv.RelName(), err)
|
|
l.WithError(pfs.err).Error("")
|
|
continue fsloop
|
|
}
|
|
// note that we cannot use CreateTXG because target and receiver could be on different pools
|
|
atCursor := tfsv.Guid == rc.GetGuid()
|
|
preCursor = preCursor && !atCursor
|
|
pfs.snaps = append(pfs.snaps, snapshot{
|
|
replicated: preCursor || (a.considerSnapAtCursorReplicated && atCursor),
|
|
date: creation,
|
|
fsv: tfsv,
|
|
})
|
|
}
|
|
if preCursor {
|
|
pfs.err = fmt.Errorf("replication cursor not found in prune target filesystem versions")
|
|
l.WithError(pfs.err).Error("")
|
|
continue fsloop
|
|
}
|
|
|
|
// Apply prune rules
|
|
pfs.destroyList = pruning.PruneSnapshots(pfs.snaps, a.rules)
|
|
|
|
}
|
|
|
|
return u(func(pruner *Pruner) {
|
|
for _, pfs := range pfss {
|
|
if pfs.err != nil {
|
|
pruner.pruneCompleted = append(pruner.pruneCompleted, pfs)
|
|
} else {
|
|
pruner.prunePending = append(pruner.prunePending, pfs)
|
|
}
|
|
}
|
|
pruner.state = Exec
|
|
}).statefunc()
|
|
}
|
|
|
|
func stateExec(a *args, u updater) state {
|
|
|
|
var pfs *fs
|
|
state := u(func(pruner *Pruner) {
|
|
if len(pruner.prunePending) == 0 {
|
|
nextState := Done
|
|
for _, pfs := range pruner.pruneCompleted {
|
|
if pfs.err != nil {
|
|
nextState = ErrPerm
|
|
}
|
|
}
|
|
pruner.state = nextState
|
|
return
|
|
}
|
|
pfs = pruner.prunePending[0]
|
|
})
|
|
if state != Exec {
|
|
return state.statefunc()
|
|
}
|
|
|
|
destroyList := make([]*pdu.FilesystemVersion, len(pfs.destroyList))
|
|
for i := range destroyList {
|
|
destroyList[i] = pfs.destroyList[i].(snapshot).fsv
|
|
GetLogger(a.ctx).
|
|
WithField("fs", pfs.path).
|
|
WithField("destroy_snap", destroyList[i].Name).
|
|
Debug("policy destroys snapshot")
|
|
}
|
|
pfs.Update(nil)
|
|
req := pdu.DestroySnapshotsReq{
|
|
Filesystem: pfs.path,
|
|
Snapshots: destroyList,
|
|
}
|
|
_, err := a.target.DestroySnapshots(a.ctx, &req)
|
|
pfs.Update(err)
|
|
if err != nil && shouldRetry(err) {
|
|
return onErr(u, err)
|
|
}
|
|
// if it's not retryable, treat is like as being done
|
|
|
|
return u(func(pruner *Pruner) {
|
|
pruner.pruneCompleted = append(pruner.pruneCompleted, pfs)
|
|
pruner.prunePending = pruner.prunePending[1:]
|
|
}).statefunc()
|
|
}
|
|
|
|
func stateExecWait(a *args, u updater) state {
|
|
return doWait(Exec, a, u)
|
|
}
|
|
|
|
func statePlanWait(a *args, u updater) state {
|
|
return doWait(Plan, a, u)
|
|
}
|
|
|
|
func doWait(goback State, a *args, u updater) state {
|
|
timer := time.NewTimer(a.retryWait)
|
|
defer timer.Stop()
|
|
select {
|
|
case <-timer.C:
|
|
return u(func(pruner *Pruner) {
|
|
pruner.state = goback
|
|
}).statefunc()
|
|
case <-a.ctx.Done():
|
|
return onErr(u, a.ctx.Err())
|
|
}
|
|
}
|