2019-09-06 17:14:03 +01:00
|
|
|
// Copyright (C) 2019 Storj Labs, Inc.
|
|
|
|
// See LICENSE for copying information.
|
|
|
|
|
|
|
|
package contact
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2019-11-04 21:03:21 +00:00
|
|
|
"sync"
|
2019-09-06 17:14:03 +01:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"go.uber.org/zap"
|
|
|
|
"golang.org/x/sync/errgroup"
|
|
|
|
|
2019-12-27 11:48:47 +00:00
|
|
|
"storj.io/common/storj"
|
|
|
|
"storj.io/common/sync2"
|
2019-09-06 17:14:03 +01:00
|
|
|
)
|
|
|
|
|
|
|
|
// Chore is the contact chore for nodes announcing themselves to their trusted satellites
|
2019-09-10 14:24:16 +01:00
|
|
|
//
|
|
|
|
// architecture: Chore
|
2019-09-06 17:14:03 +01:00
|
|
|
type Chore struct {
|
2019-09-19 05:46:39 +01:00
|
|
|
log *zap.Logger
|
|
|
|
service *Service
|
2019-09-06 17:14:03 +01:00
|
|
|
|
2019-11-04 21:03:21 +00:00
|
|
|
mu sync.Mutex
|
2019-11-16 00:59:32 +00:00
|
|
|
cycles map[storj.NodeID]*sync2.Cycle
|
2019-11-04 21:03:21 +00:00
|
|
|
started sync2.Fence
|
|
|
|
interval time.Duration
|
2019-09-06 17:14:03 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// NewChore creates a new contact chore
|
2020-02-26 02:39:44 +00:00
|
|
|
func NewChore(log *zap.Logger, interval time.Duration, service *Service) *Chore {
|
2019-09-06 17:14:03 +01:00
|
|
|
return &Chore{
|
2019-09-19 05:46:39 +01:00
|
|
|
log: log,
|
|
|
|
service: service,
|
2019-09-06 17:14:03 +01:00
|
|
|
|
2019-11-16 00:59:32 +00:00
|
|
|
cycles: make(map[storj.NodeID]*sync2.Cycle),
|
2019-11-04 21:03:21 +00:00
|
|
|
interval: interval,
|
2019-09-06 17:14:03 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Run the contact chore on a regular interval with jitter
|
|
|
|
func (chore *Chore) Run(ctx context.Context) (err error) {
|
|
|
|
defer mon.Task()(&ctx)(&err)
|
2019-11-04 21:03:21 +00:00
|
|
|
var group errgroup.Group
|
|
|
|
|
2019-10-28 14:04:31 +00:00
|
|
|
if !chore.service.initialized.Wait(ctx) {
|
|
|
|
return ctx.Err()
|
2019-10-26 18:16:25 +01:00
|
|
|
}
|
|
|
|
|
2019-11-16 00:59:32 +00:00
|
|
|
// configure the satellite ping cycles
|
2020-02-26 02:39:44 +00:00
|
|
|
chore.updateCycles(ctx, &group, chore.service.trust.GetSatellites(ctx))
|
2019-11-16 00:59:32 +00:00
|
|
|
|
|
|
|
// set up a cycle to update ping cycles on a frequent interval
|
|
|
|
refreshCycle := sync2.NewCycle(time.Minute)
|
|
|
|
refreshCycle.Start(ctx, &group, func(ctx context.Context) error {
|
2020-02-26 02:39:44 +00:00
|
|
|
chore.updateCycles(ctx, &group, chore.service.trust.GetSatellites(ctx))
|
2019-11-16 00:59:32 +00:00
|
|
|
return nil
|
|
|
|
})
|
|
|
|
|
|
|
|
defer refreshCycle.Close()
|
|
|
|
|
|
|
|
chore.started.Release()
|
|
|
|
return group.Wait()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (chore *Chore) updateCycles(ctx context.Context, group *errgroup.Group, satellites []storj.NodeID) {
|
2019-11-04 21:03:21 +00:00
|
|
|
chore.mu.Lock()
|
2019-11-16 00:59:32 +00:00
|
|
|
defer chore.mu.Unlock()
|
|
|
|
|
|
|
|
trustedIDs := make(map[storj.NodeID]struct{})
|
|
|
|
|
|
|
|
for _, satellite := range satellites {
|
|
|
|
satellite := satellite // alias the loop var since it is captured below
|
2019-11-04 21:03:21 +00:00
|
|
|
|
2019-11-16 00:59:32 +00:00
|
|
|
trustedIDs[satellite] = struct{}{}
|
|
|
|
if _, ok := chore.cycles[satellite]; ok {
|
|
|
|
// Ping cycle has already been started for this satellite
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
// Set up a new ping cycle for the newly trusted satellite
|
|
|
|
chore.log.Debug("Starting cycle", zap.Stringer("Satellite ID", satellite))
|
2019-11-04 21:03:21 +00:00
|
|
|
cycle := sync2.NewCycle(chore.interval)
|
2019-11-16 00:59:32 +00:00
|
|
|
chore.cycles[satellite] = cycle
|
|
|
|
cycle.Start(ctx, group, func(ctx context.Context) error {
|
2020-02-26 02:39:44 +00:00
|
|
|
return chore.service.pingSatellite(ctx, satellite, chore.interval)
|
2019-11-04 21:03:21 +00:00
|
|
|
})
|
|
|
|
}
|
2019-11-16 00:59:32 +00:00
|
|
|
|
|
|
|
// Stop the ping cycle for satellites that are no longer trusted
|
|
|
|
for satellite, cycle := range chore.cycles {
|
|
|
|
if _, ok := trustedIDs[satellite]; !ok {
|
|
|
|
chore.log.Debug("Stopping cycle", zap.Stringer("Satellite ID", satellite))
|
|
|
|
cycle.Close()
|
|
|
|
delete(chore.cycles, satellite)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-11-04 21:03:21 +00:00
|
|
|
// Pause stops all the cycles in the contact chore.
|
2020-02-19 18:32:53 +00:00
|
|
|
func (chore *Chore) Pause(ctx context.Context) {
|
|
|
|
chore.started.Wait(ctx)
|
2019-11-04 21:03:21 +00:00
|
|
|
chore.mu.Lock()
|
|
|
|
defer chore.mu.Unlock()
|
|
|
|
for _, cycle := range chore.cycles {
|
|
|
|
cycle.Pause()
|
|
|
|
}
|
2020-02-12 21:08:28 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Trigger ensures that each cycle is done at least once.
|
|
|
|
// If the cycle is currently running it waits for the previous to complete and then runs.
|
2020-02-19 18:32:53 +00:00
|
|
|
func (chore *Chore) Trigger(ctx context.Context) {
|
|
|
|
chore.started.Wait(ctx)
|
2020-02-12 21:08:28 +00:00
|
|
|
chore.mu.Lock()
|
|
|
|
defer chore.mu.Unlock()
|
|
|
|
for _, cycle := range chore.cycles {
|
|
|
|
cycle := cycle
|
|
|
|
go func() {
|
|
|
|
cycle.Trigger()
|
|
|
|
}()
|
|
|
|
}
|
2019-11-04 21:03:21 +00:00
|
|
|
}
|
2019-09-06 17:14:03 +01:00
|
|
|
|
2019-11-04 21:03:21 +00:00
|
|
|
// TriggerWait ensures that each cycle is done at least once and waits for completion.
|
|
|
|
// If the cycle is currently running it waits for the previous to complete and then runs.
|
2020-02-19 18:32:53 +00:00
|
|
|
func (chore *Chore) TriggerWait(ctx context.Context) {
|
|
|
|
chore.started.Wait(ctx)
|
2019-11-04 21:03:21 +00:00
|
|
|
chore.mu.Lock()
|
|
|
|
defer chore.mu.Unlock()
|
|
|
|
var group errgroup.Group
|
|
|
|
for _, cycle := range chore.cycles {
|
|
|
|
cycle := cycle
|
|
|
|
group.Go(func() error {
|
|
|
|
cycle.TriggerWait()
|
|
|
|
return nil
|
2019-09-06 17:14:03 +01:00
|
|
|
})
|
|
|
|
}
|
2020-02-19 18:32:53 +00:00
|
|
|
_ = group.Wait() // goroutines aren't returning any errors
|
2019-09-06 17:14:03 +01:00
|
|
|
}
|
|
|
|
|
2019-11-04 21:03:21 +00:00
|
|
|
// Close stops all the cycles in the contact chore.
|
2019-09-06 17:14:03 +01:00
|
|
|
func (chore *Chore) Close() error {
|
2019-11-04 21:03:21 +00:00
|
|
|
chore.mu.Lock()
|
|
|
|
defer chore.mu.Unlock()
|
|
|
|
for _, cycle := range chore.cycles {
|
|
|
|
cycle.Close()
|
|
|
|
}
|
|
|
|
chore.cycles = nil
|
2019-09-06 17:14:03 +01:00
|
|
|
return nil
|
|
|
|
}
|