mirror of
https://github.com/zrepl/zrepl.git
synced 2025-01-03 12:58:57 +01:00
10a14a8c50
package trace: - introduce the concept of tasks and spans, tracked as linked list within ctx - see package-level docs for an overview of the concepts - **main feature 1**: unique stack of task and span IDs - makes it easy to follow a series of log entries in concurrent code - **main feature 2**: ability to produce a chrome://tracing-compatible trace file - either via an env variable or a `zrepl pprof` subcommand - this is not a CPU profile, we already have go pprof for that - but it is very useful to visually inspect where the replication / snapshotter / pruner spends its time ( fixes #307 ) usage in package daemon/logging: - goal: every log entry should have a trace field with the ID stack from package trace - make `logging.GetLogger(ctx, Subsys)` the authoritative `logger.Logger` factory function - the context carries a linked list of injected fields which `logging.GetLogger` adds to the logger it returns - `logging.GetLogger` also uses package `trace` to get the task-and-span-stack and injects it into the returned logger's fields
133 lines
4.6 KiB
Go
133 lines
4.6 KiB
Go
package rpc
|
|
|
|
import (
|
|
"context"
|
|
"time"
|
|
|
|
"github.com/zrepl/zrepl/endpoint"
|
|
"github.com/zrepl/zrepl/replication/logic/pdu"
|
|
"github.com/zrepl/zrepl/rpc/dataconn"
|
|
"github.com/zrepl/zrepl/rpc/grpcclientidentity"
|
|
"github.com/zrepl/zrepl/rpc/grpcclientidentity/grpchelper"
|
|
"github.com/zrepl/zrepl/rpc/versionhandshake"
|
|
"github.com/zrepl/zrepl/transport"
|
|
"github.com/zrepl/zrepl/util/envconst"
|
|
)
|
|
|
|
// Handler is the request handler a Server routes to.
//
// It combines the control-plane methods (pdu.ReplicationServer, registered
// with the control server in NewServer) with the data-plane methods
// (dataconn.Handler, handed to the dataconn server in NewServer).
type Handler interface {
	pdu.ReplicationServer
	dataconn.Handler
}
|
|
|
|
// serveFunc runs one of the two sub-servers on demuxedListener.
//
// Both implementations built in NewServer send exactly one value on errOut
// once serving has ended; (*Server).Serve relies on that to know when a
// sub-server is done.
type serveFunc func(ctx context.Context, demuxedListener transport.AuthenticatedListener, errOut chan<- error)
|
|
|
|
// Server abstracts the accept and request routing infrastructure for the
// passive side of a replication setup.
//
// Instances are constructed by NewServer and run by Serve.
type Server struct {
	// logger receives Serve's own log output (loggers.General in NewServer).
	logger Logger
	// handler is the Handler that was passed to NewServer.
	handler Handler
	// controlServerServe runs the control server; started by Serve.
	controlServerServe serveFunc
	// dataServer is the dataconn server that dataServerServe runs.
	dataServer *dataconn.Server
	// dataServerServe runs dataServer; started by Serve.
	dataServerServe serveFunc
}
|
|
|
|
// HandlerContextInterceptorData describes the request that a
// HandlerContextInterceptor is being invoked for.
type HandlerContextInterceptorData interface {
	// FullMethod returns the name of the invoked method.
	FullMethod() string
	// ClientIdentity returns the identity of the calling client.
	ClientIdentity() string
}

// interceptorData decorates another HandlerContextInterceptorData by
// prepending prefixMethod to the method name it reports.
//
// The field order matters: values are built with positional composite
// literals.
type interceptorData struct {
	prefixMethod string
	wrapped      HandlerContextInterceptorData
}

// ClientIdentity returns the wrapped value's client identity unchanged.
func (d interceptorData) ClientIdentity() string {
	return d.wrapped.ClientIdentity()
}

// FullMethod returns the wrapped value's method name with prefixMethod
// prepended.
func (d interceptorData) FullMethod() string {
	method := d.wrapped.FullMethod()
	return d.prefixMethod + method
}
|
|
|
|
// HandlerContextInterceptor is the hook passed to NewServer. It is given the
// request context, data describing the request, and the handler continuation.
//
// NOTE(review): presumably an implementation is expected to call handler
// (possibly with a derived context) — confirm against the grpcclientidentity
// and dataconn interceptor contracts.
type HandlerContextInterceptor func(ctx context.Context, data HandlerContextInterceptorData, handler func(ctx context.Context))
|
|
|
|
// config must be valid (use its Validate function).
|
|
func NewServer(handler Handler, loggers Loggers, ctxInterceptor HandlerContextInterceptor) *Server {
|
|
|
|
// setup control server
|
|
controlServerServe := func(ctx context.Context, controlListener transport.AuthenticatedListener, errOut chan<- error) {
|
|
|
|
var controlCtxInterceptor grpcclientidentity.Interceptor = func(ctx context.Context, data grpcclientidentity.ContextInterceptorData, handler func(ctx context.Context)) {
|
|
ctxInterceptor(ctx, interceptorData{"control://", data}, handler)
|
|
}
|
|
controlServer, serve := grpchelper.NewServer(controlListener, endpoint.ClientIdentityKey, loggers.Control, controlCtxInterceptor)
|
|
pdu.RegisterReplicationServer(controlServer, handler)
|
|
|
|
// give time for graceful stop until deadline expires, then hard stop
|
|
go func() {
|
|
<-ctx.Done()
|
|
if dl, ok := ctx.Deadline(); ok {
|
|
go time.AfterFunc(dl.Sub(dl), controlServer.Stop)
|
|
}
|
|
loggers.Control.Debug("gracefully shutting down control server")
|
|
controlServer.GracefulStop()
|
|
loggers.Control.Debug("gracdeful shut down of control server complete")
|
|
}()
|
|
|
|
errOut <- serve()
|
|
}
|
|
|
|
// setup data server
|
|
dataServerClientIdentitySetter := func(ctx context.Context, wire *transport.AuthConn) (context.Context, *transport.AuthConn) {
|
|
ci := wire.ClientIdentity()
|
|
ctx = context.WithValue(ctx, endpoint.ClientIdentityKey, ci)
|
|
return ctx, wire
|
|
}
|
|
var dataCtxInterceptor dataconn.ContextInterceptor = func(ctx context.Context, data dataconn.ContextInterceptorData, handler func(ctx context.Context)) {
|
|
ctxInterceptor(ctx, interceptorData{"data://", data}, handler)
|
|
}
|
|
dataServer := dataconn.NewServer(dataServerClientIdentitySetter, dataCtxInterceptor, loggers.Data, handler)
|
|
dataServerServe := func(ctx context.Context, dataListener transport.AuthenticatedListener, errOut chan<- error) {
|
|
dataServer.Serve(ctx, dataListener)
|
|
errOut <- nil // TODO bad design of dataServer?
|
|
}
|
|
|
|
server := &Server{
|
|
logger: loggers.General,
|
|
handler: handler,
|
|
controlServerServe: controlServerServe,
|
|
dataServer: dataServer,
|
|
dataServerServe: dataServerServe,
|
|
}
|
|
|
|
return server
|
|
}
|
|
|
|
// The context is used for cancellation only.
|
|
// Serve never returns an error, it logs them to the Server's logger.
|
|
func (s *Server) Serve(ctx context.Context, l transport.AuthenticatedListener) {
|
|
ctx, cancel := context.WithCancel(ctx)
|
|
defer cancel()
|
|
defer s.logger.Debug("rpc.(*Server).Serve done")
|
|
|
|
l = versionhandshake.Listener(l, envconst.Duration("ZREPL_RPC_SERVER_VERSIONHANDSHAKE_TIMEOUT", 10*time.Second))
|
|
|
|
// it is important that demux's context is cancelled,
|
|
// it has background goroutines attached
|
|
demuxListener := demux(ctx, l)
|
|
|
|
serveErrors := make(chan error, 2)
|
|
go s.controlServerServe(ctx, demuxListener.control, serveErrors)
|
|
go s.dataServerServe(ctx, demuxListener.data, serveErrors)
|
|
select {
|
|
case serveErr := <-serveErrors:
|
|
s.logger.WithError(serveErr).Error("serve error")
|
|
s.logger.Debug("wait for other server to shut down")
|
|
cancel()
|
|
secondServeErr := <-serveErrors
|
|
s.logger.WithError(secondServeErr).Error("serve error")
|
|
case <-ctx.Done():
|
|
s.logger.Debug("context cancelled, wait for control and data servers")
|
|
cancel()
|
|
for i := 0; i < 2; i++ {
|
|
<-serveErrors
|
|
}
|
|
s.logger.Debug("control and data server shut down, returning from Serve")
|
|
}
|
|
}
|