2018-10-10 19:25:46 +01:00
|
|
|
// Copyright (C) 2018 Storj Labs, Inc.
|
|
|
|
// See LICENSE for copying information.
|
|
|
|
|
|
|
|
package audit
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2018-10-16 21:02:18 +01:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"go.uber.org/zap"
|
2018-10-10 19:25:46 +01:00
|
|
|
|
|
|
|
"storj.io/storj/pkg/overlay"
|
2019-01-10 16:35:18 +00:00
|
|
|
"storj.io/storj/pkg/pointerdb"
|
2018-10-10 19:25:46 +01:00
|
|
|
"storj.io/storj/pkg/provider"
|
|
|
|
"storj.io/storj/pkg/transport"
|
|
|
|
)
|
|
|
|
|
|
|
|
// Service helps coordinate Cursor and Verifier to run the audit process continuously
|
|
|
|
type Service struct {
|
2019-01-10 16:35:18 +00:00
|
|
|
log *zap.Logger
|
2018-10-10 19:25:46 +01:00
|
|
|
Cursor *Cursor
|
|
|
|
Verifier *Verifier
|
2018-10-16 18:40:34 +01:00
|
|
|
Reporter reporter
|
2018-11-01 14:03:45 +00:00
|
|
|
ticker *time.Ticker
|
2018-10-16 18:40:34 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// Config holds the user-configurable settings of the audit service.
// The struct tags carry the help text and default value of each setting.
type Config struct {
	// APIKey is forwarded to NewService as the statdb API key.
	APIKey string `help:"APIKey to access the statdb" default:""`

	// SatelliteAddr is the satellite address; Run uses it both for the overlay
	// client and as the statdb address passed to NewService.
	SatelliteAddr string `help:"address to contact services on the satellite"`

	// MaxRetriesStatDB bounds the number of attempts per statdb batch update.
	MaxRetriesStatDB int `help:"max number of times to attempt updating a statdb batch" default:"3"`

	// Interval is the period of the audit ticker created in NewService.
	Interval time.Duration `help:"how frequently segments are audited" default:"30s"`
}
|
|
|
|
|
|
|
|
// Run runs the repairer with the configured values
|
|
|
|
func (c Config) Run(ctx context.Context, server *provider.Provider) (err error) {
|
2018-11-07 01:16:43 +00:00
|
|
|
identity := server.Identity()
|
2019-01-10 16:35:18 +00:00
|
|
|
pointers := pointerdb.LoadFromContext(ctx)
|
2019-01-11 12:45:11 +00:00
|
|
|
if pointers == nil {
|
|
|
|
return Error.New("programmer error: pointerdb responsibility unstarted")
|
2018-10-16 21:02:18 +01:00
|
|
|
}
|
2019-01-11 12:45:11 +00:00
|
|
|
|
2018-12-20 13:57:54 +00:00
|
|
|
overlay, err := overlay.NewClient(identity, c.SatelliteAddr)
|
2018-11-07 01:16:43 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
transport := transport.NewClient(identity)
|
2019-01-10 16:35:18 +00:00
|
|
|
|
|
|
|
log := zap.L()
|
|
|
|
service, err := NewService(ctx, log, c.SatelliteAddr, c.Interval, c.MaxRetriesStatDB, pointers, transport, overlay, *identity, c.APIKey)
|
2018-11-07 01:16:43 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
go func() {
|
|
|
|
err := service.Run(ctx)
|
2019-01-10 16:35:18 +00:00
|
|
|
service.log.Error("audit service failed to run:", zap.Error(err))
|
2018-11-07 01:16:43 +00:00
|
|
|
}()
|
|
|
|
return server.Run(ctx)
|
2018-10-10 19:25:46 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// NewService instantiates a Service with access to a Cursor and Verifier
|
2019-01-10 16:35:18 +00:00
|
|
|
func NewService(ctx context.Context, log *zap.Logger, statDBPort string, interval time.Duration, maxRetries int, pointers *pointerdb.Server, transport transport.Client, overlay overlay.Client,
|
2018-11-07 01:16:43 +00:00
|
|
|
identity provider.FullIdentity, apiKey string) (service *Service, err error) {
|
2019-01-18 13:54:08 +00:00
|
|
|
|
|
|
|
//TODO: instead of statDBPort pass in the actual database interface
|
2018-10-10 19:25:46 +01:00
|
|
|
cursor := NewCursor(pointers)
|
2018-11-07 01:16:43 +00:00
|
|
|
verifier := NewVerifier(transport, overlay, identity)
|
|
|
|
reporter, err := NewReporter(ctx, statDBPort, maxRetries, apiKey)
|
2018-10-16 18:40:34 +01:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2018-10-16 21:02:18 +01:00
|
|
|
|
2018-11-01 14:03:45 +00:00
|
|
|
return &Service{
|
2019-01-10 16:35:18 +00:00
|
|
|
log: log,
|
2018-11-01 14:03:45 +00:00
|
|
|
Cursor: cursor,
|
2018-10-16 21:02:18 +01:00
|
|
|
Verifier: verifier,
|
|
|
|
Reporter: reporter,
|
2018-11-01 14:03:45 +00:00
|
|
|
ticker: time.NewTicker(interval),
|
2018-10-16 21:02:18 +01:00
|
|
|
}, nil
|
2018-10-10 19:25:46 +01:00
|
|
|
}
|
|
|
|
|
2018-11-01 14:03:45 +00:00
|
|
|
// Run runs auditing service
|
|
|
|
func (service *Service) Run(ctx context.Context) (err error) {
|
2018-10-16 21:02:18 +01:00
|
|
|
defer mon.Task()(&ctx)(&err)
|
2019-01-10 16:35:18 +00:00
|
|
|
service.log.Info("Audit cron is starting up")
|
2018-11-01 14:03:45 +00:00
|
|
|
|
|
|
|
for {
|
|
|
|
err := service.process(ctx)
|
|
|
|
if err != nil {
|
2019-01-10 16:35:18 +00:00
|
|
|
service.log.Error("process", zap.Error(err))
|
2018-11-01 14:03:45 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case <-service.ticker.C:
|
|
|
|
case <-ctx.Done():
|
|
|
|
return ctx.Err()
|
2018-10-16 21:02:18 +01:00
|
|
|
}
|
2018-11-01 14:03:45 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// process picks a random stripe and verifies correctness
|
|
|
|
func (service *Service) process(ctx context.Context) error {
|
|
|
|
stripe, err := service.Cursor.NextStripe(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2018-11-07 01:16:43 +00:00
|
|
|
if stripe == nil {
|
2018-11-08 22:36:44 +00:00
|
|
|
return nil
|
2018-11-07 01:16:43 +00:00
|
|
|
}
|
2018-11-01 14:03:45 +00:00
|
|
|
|
2019-01-06 18:51:01 +00:00
|
|
|
verifiedNodes, err := service.Verifier.verify(ctx, stripe)
|
2018-11-01 14:03:45 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2018-12-19 18:44:03 +00:00
|
|
|
// TODO(moby) we need to decide if we want to do something with nodes that the reporter failed to update
|
|
|
|
_, err = service.Reporter.RecordAudits(ctx, verifiedNodes)
|
2018-11-01 14:03:45 +00:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2018-10-16 21:02:18 +01:00
|
|
|
|
2018-11-01 14:03:45 +00:00
|
|
|
return nil
|
2018-10-10 19:25:46 +01:00
|
|
|
}
|