2019-01-24 20:15:10 +00:00
|
|
|
// Copyright (C) 2019 Storj Labs, Inc.
|
2018-06-13 19:22:32 +01:00
|
|
|
// See LICENSE for copying information.
|
|
|
|
|
2018-11-19 14:40:01 +00:00
|
|
|
package overlay_test
|
2018-06-13 19:22:32 +01:00
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2020-04-29 18:58:41 +01:00
|
|
|
"fmt"
|
2020-03-13 18:01:48 +00:00
|
|
|
"reflect"
|
2019-12-16 13:45:13 +00:00
|
|
|
"sort"
|
2018-06-13 19:22:32 +01:00
|
|
|
"testing"
|
2019-04-26 13:15:06 +01:00
|
|
|
"time"
|
2018-06-13 19:22:32 +01:00
|
|
|
|
|
|
|
"github.com/stretchr/testify/assert"
|
2019-02-09 21:17:49 +00:00
|
|
|
"github.com/stretchr/testify/require"
|
2020-04-24 20:34:53 +01:00
|
|
|
"go.uber.org/zap"
|
2019-03-23 08:06:11 +00:00
|
|
|
"go.uber.org/zap/zaptest"
|
2020-06-08 16:27:08 +01:00
|
|
|
"golang.org/x/sync/errgroup"
|
2019-02-06 13:32:42 +00:00
|
|
|
|
2020-04-24 20:34:53 +01:00
|
|
|
"storj.io/common/memory"
|
2019-12-27 11:48:47 +00:00
|
|
|
"storj.io/common/pb"
|
|
|
|
"storj.io/common/storj"
|
|
|
|
"storj.io/common/testcontext"
|
|
|
|
"storj.io/common/testrand"
|
2019-11-14 19:46:15 +00:00
|
|
|
"storj.io/storj/private/testplanet"
|
2018-12-27 09:56:25 +00:00
|
|
|
"storj.io/storj/satellite"
|
2019-07-28 06:55:36 +01:00
|
|
|
"storj.io/storj/satellite/overlay"
|
2018-12-17 20:14:16 +00:00
|
|
|
"storj.io/storj/satellite/satellitedb/satellitedbtest"
|
2018-06-13 19:22:32 +01:00
|
|
|
)
|
|
|
|
|
2019-01-15 16:08:45 +00:00
|
|
|
func TestCache_Database(t *testing.T) {
|
2019-02-06 13:32:42 +00:00
|
|
|
t.Parallel()
|
|
|
|
|
2020-01-19 16:29:15 +00:00
|
|
|
satellitedbtest.Run(t, func(ctx *testcontext.Context, t *testing.T, db satellite.DB) {
|
2019-03-25 22:25:09 +00:00
|
|
|
testCache(ctx, t, db.OverlayCache())
|
2019-01-15 16:08:45 +00:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-07-16 15:18:02 +01:00
|
|
|
// returns a NodeSelectionConfig with sensible test values.
|
2020-07-08 15:28:49 +01:00
|
|
|
func testNodeSelectionConfig(newNodeFraction float64, distinctIP bool) overlay.NodeSelectionConfig {
|
2019-06-13 17:06:37 +01:00
|
|
|
return overlay.NodeSelectionConfig{
|
2020-07-08 15:28:49 +01:00
|
|
|
AuditCount: 0,
|
2020-03-18 21:16:13 +00:00
|
|
|
NewNodeFraction: newNodeFraction,
|
|
|
|
OnlineWindow: time.Hour,
|
|
|
|
DistinctIP: distinctIP,
|
2019-06-13 22:51:18 +01:00
|
|
|
|
2020-01-03 00:00:18 +00:00
|
|
|
AuditReputationRepairWeight: 1,
|
|
|
|
AuditReputationUplinkWeight: 1,
|
|
|
|
AuditReputationLambda: 1,
|
|
|
|
AuditReputationWeight: 1,
|
|
|
|
AuditReputationDQ: 0.5,
|
2019-06-13 17:06:37 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-04 21:28:46 +01:00
|
|
|
// returns an AuditHistoryConfig with sensible test values.
|
|
|
|
func testAuditHistoryConfig() overlay.AuditHistoryConfig {
|
|
|
|
return overlay.AuditHistoryConfig{
|
|
|
|
WindowSize: time.Hour,
|
|
|
|
TrackingPeriod: time.Hour,
|
|
|
|
GracePeriod: time.Hour,
|
|
|
|
OfflineThreshold: 0,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-03-25 22:25:09 +00:00
|
|
|
func testCache(ctx context.Context, t *testing.T, store overlay.DB) {
|
2019-06-26 11:38:51 +01:00
|
|
|
valid1ID := testrand.NodeID()
|
|
|
|
valid2ID := testrand.NodeID()
|
2019-07-12 15:35:48 +01:00
|
|
|
valid3ID := testrand.NodeID()
|
2019-06-26 11:38:51 +01:00
|
|
|
missingID := testrand.NodeID()
|
2019-05-30 18:35:04 +01:00
|
|
|
address := &pb.NodeAddress{Address: "127.0.0.1:0"}
|
2020-04-29 18:58:41 +01:00
|
|
|
lastNet := "127.0.0"
|
2018-12-17 18:47:26 +00:00
|
|
|
|
2020-07-08 15:28:49 +01:00
|
|
|
nodeSelectionConfig := testNodeSelectionConfig(0, false)
|
2020-08-04 21:28:46 +01:00
|
|
|
serviceConfig := overlay.Config{Node: nodeSelectionConfig, UpdateStatsBatchSize: 100, AuditHistory: testAuditHistoryConfig()}
|
2020-12-22 19:07:07 +00:00
|
|
|
service, err := overlay.NewService(zaptest.NewLogger(t), store, serviceConfig)
|
|
|
|
require.NoError(t, err)
|
2020-04-29 18:58:41 +01:00
|
|
|
d := overlay.NodeCheckInInfo{
|
|
|
|
Address: address,
|
|
|
|
LastIPPort: address.Address,
|
|
|
|
LastNet: lastNet,
|
|
|
|
Version: &pb.NodeVersion{Version: "v1.0.0"},
|
|
|
|
IsUp: true,
|
|
|
|
}
|
2018-11-19 14:40:01 +00:00
|
|
|
{ // Put
|
2020-04-29 18:58:41 +01:00
|
|
|
d.NodeID = valid1ID
|
|
|
|
err := store.UpdateCheckIn(ctx, d, time.Now().UTC(), nodeSelectionConfig)
|
2019-06-28 14:04:50 +01:00
|
|
|
require.NoError(t, err)
|
2018-12-17 18:47:26 +00:00
|
|
|
|
2020-04-29 18:58:41 +01:00
|
|
|
d.NodeID = valid2ID
|
|
|
|
err = store.UpdateCheckIn(ctx, d, time.Now().UTC(), nodeSelectionConfig)
|
2019-06-28 14:04:50 +01:00
|
|
|
require.NoError(t, err)
|
2019-07-12 15:35:48 +01:00
|
|
|
|
2020-04-29 18:58:41 +01:00
|
|
|
d.NodeID = valid3ID
|
|
|
|
err = store.UpdateCheckIn(ctx, d, time.Now().UTC(), nodeSelectionConfig)
|
2019-07-12 15:35:48 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-01-03 00:00:18 +00:00
|
|
|
// disqualify one node
|
|
|
|
err = service.DisqualifyNode(ctx, valid3ID)
|
2019-07-12 15:35:48 +01:00
|
|
|
require.NoError(t, err)
|
2018-11-19 14:40:01 +00:00
|
|
|
}
|
2018-11-16 16:31:14 +00:00
|
|
|
|
2018-11-19 14:40:01 +00:00
|
|
|
{ // Get
|
2019-08-06 17:35:59 +01:00
|
|
|
_, err := service.Get(ctx, storj.NodeID{})
|
2019-06-20 14:56:04 +01:00
|
|
|
require.Error(t, err)
|
2020-07-14 14:04:38 +01:00
|
|
|
require.Equal(t, overlay.ErrEmptyNode, err)
|
2018-12-17 18:47:26 +00:00
|
|
|
|
2019-08-06 17:35:59 +01:00
|
|
|
valid1, err := service.Get(ctx, valid1ID)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, valid1.Id, valid1ID)
|
2018-12-17 18:47:26 +00:00
|
|
|
|
2019-08-06 17:35:59 +01:00
|
|
|
valid2, err := service.Get(ctx, valid2ID)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, valid2.Id, valid2ID)
|
2018-11-16 16:31:14 +00:00
|
|
|
|
2019-08-06 17:35:59 +01:00
|
|
|
invalid2, err := service.Get(ctx, missingID)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.Error(t, err)
|
|
|
|
require.True(t, overlay.ErrNodeNotFound.Has(err))
|
|
|
|
require.Nil(t, invalid2)
|
2018-11-16 16:31:14 +00:00
|
|
|
|
2019-01-15 16:08:45 +00:00
|
|
|
// TODO: add erroring database test
|
2018-11-19 14:40:01 +00:00
|
|
|
}
|
2018-11-16 16:31:14 +00:00
|
|
|
|
2019-06-20 14:56:04 +01:00
|
|
|
{ // Reputation
|
2019-08-06 17:35:59 +01:00
|
|
|
valid1, err := service.Get(ctx, valid1ID)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.EqualValues(t, valid1.Id, valid1ID)
|
2020-04-13 22:38:33 +01:00
|
|
|
require.EqualValues(t, valid1.Reputation.AuditReputationAlpha, 1)
|
|
|
|
require.EqualValues(t, valid1.Reputation.AuditReputationBeta, 0)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.Nil(t, valid1.Reputation.Disqualified)
|
|
|
|
|
2019-08-06 17:35:59 +01:00
|
|
|
stats, err := service.UpdateStats(ctx, &overlay.UpdateRequest{
|
2019-06-20 14:56:04 +01:00
|
|
|
NodeID: valid1ID,
|
2020-03-09 15:35:54 +00:00
|
|
|
AuditOutcome: overlay.AuditFailure,
|
2019-06-20 14:56:04 +01:00
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
newAuditAlpha := 1
|
|
|
|
newAuditBeta := 1
|
|
|
|
require.EqualValues(t, stats.AuditReputationAlpha, newAuditAlpha)
|
|
|
|
require.EqualValues(t, stats.AuditReputationBeta, newAuditBeta)
|
|
|
|
require.NotNil(t, stats.Disqualified)
|
2020-03-10 22:05:01 +00:00
|
|
|
require.True(t, time.Since(*stats.Disqualified) < time.Minute)
|
2019-06-20 14:56:04 +01:00
|
|
|
|
2020-01-03 00:00:18 +00:00
|
|
|
err = service.DisqualifyNode(ctx, valid2ID)
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
// should not update once already disqualified
|
2019-08-06 17:35:59 +01:00
|
|
|
_, err = service.BatchUpdateStats(ctx, []*overlay.UpdateRequest{{
|
2019-06-20 14:56:04 +01:00
|
|
|
NodeID: valid2ID,
|
2020-03-09 15:35:54 +00:00
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
2019-07-31 18:21:06 +01:00
|
|
|
}})
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
2019-08-06 17:35:59 +01:00
|
|
|
dossier, err := service.Get(ctx, valid2ID)
|
2019-06-20 14:56:04 +01:00
|
|
|
|
|
|
|
require.NoError(t, err)
|
2020-04-13 22:38:33 +01:00
|
|
|
require.EqualValues(t, dossier.Reputation.AuditReputationAlpha, 1)
|
|
|
|
require.EqualValues(t, dossier.Reputation.AuditReputationBeta, 0)
|
2019-07-31 18:21:06 +01:00
|
|
|
require.NotNil(t, dossier.Disqualified)
|
2019-06-20 14:56:04 +01:00
|
|
|
}
|
2018-11-16 16:31:14 +00:00
|
|
|
}
|
2019-02-09 21:17:49 +00:00
|
|
|
|
|
|
|
func TestRandomizedSelection(t *testing.T) {
|
|
|
|
t.Parallel()
|
|
|
|
|
|
|
|
totalNodes := 1000
|
|
|
|
selectIterations := 100
|
|
|
|
numNodesToSelect := 100
|
2019-02-11 12:04:00 +00:00
|
|
|
minSelectCount := 3 // TODO: compute this limit better
|
2019-02-09 21:17:49 +00:00
|
|
|
|
2020-01-19 16:29:15 +00:00
|
|
|
satellitedbtest.Run(t, func(ctx *testcontext.Context, t *testing.T, db satellite.DB) {
|
2019-02-09 21:17:49 +00:00
|
|
|
cache := db.OverlayCache()
|
|
|
|
allIDs := make(storj.NodeIDList, totalNodes)
|
|
|
|
nodeCounts := make(map[storj.NodeID]int)
|
2020-07-08 15:28:49 +01:00
|
|
|
config := overlay.NodeSelectionConfig{
|
|
|
|
AuditCount: 1,
|
|
|
|
}
|
2019-02-09 21:17:49 +00:00
|
|
|
|
|
|
|
// put nodes in cache
|
|
|
|
for i := 0; i < totalNodes; i++ {
|
2019-06-26 11:38:51 +01:00
|
|
|
newID := testrand.NodeID()
|
2020-04-29 18:58:41 +01:00
|
|
|
addr := fmt.Sprintf("127.0.%d.0:8080", i)
|
|
|
|
lastNet := fmt.Sprintf("127.0.%d", i)
|
|
|
|
d := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: newID,
|
|
|
|
Address: &pb.NodeAddress{Address: addr, Transport: pb.NodeTransport_TCP_TLS_GRPC},
|
|
|
|
LastIPPort: addr,
|
|
|
|
LastNet: lastNet,
|
|
|
|
Version: &pb.NodeVersion{Version: "v1.0.0"},
|
|
|
|
Capacity: &pb.NodeCapacity{},
|
|
|
|
IsUp: true,
|
|
|
|
}
|
2020-07-08 15:28:49 +01:00
|
|
|
err := cache.UpdateCheckIn(ctx, d, time.Now().UTC(), config)
|
2019-02-09 21:17:49 +00:00
|
|
|
require.NoError(t, err)
|
2019-06-20 14:56:04 +01:00
|
|
|
|
|
|
|
if i%2 == 0 { // make half of nodes "new" and half "vetted"
|
|
|
|
_, err = cache.UpdateStats(ctx, &overlay.UpdateRequest{
|
|
|
|
NodeID: newID,
|
2020-03-09 15:35:54 +00:00
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
2019-06-20 14:56:04 +01:00
|
|
|
AuditLambda: 1,
|
|
|
|
AuditWeight: 1,
|
|
|
|
AuditDQ: 0.5,
|
2020-08-26 21:26:10 +01:00
|
|
|
AuditHistory: testAuditHistoryConfig(),
|
|
|
|
}, time.Now())
|
2019-06-20 14:56:04 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
}
|
|
|
|
|
2019-02-09 21:17:49 +00:00
|
|
|
allIDs[i] = newID
|
|
|
|
nodeCounts[newID] = 0
|
|
|
|
}
|
|
|
|
|
|
|
|
// select numNodesToSelect nodes selectIterations times
|
|
|
|
for i := 0; i < selectIterations; i++ {
|
2020-03-28 14:56:05 +00:00
|
|
|
var nodes []*overlay.SelectedNode
|
2019-02-11 17:10:32 +00:00
|
|
|
var err error
|
|
|
|
|
2019-04-24 11:35:50 +01:00
|
|
|
if i%2 == 0 {
|
2020-04-09 16:19:44 +01:00
|
|
|
nodes, err = cache.SelectStorageNodes(ctx, numNodesToSelect, 0, &overlay.NodeCriteria{
|
2019-06-20 14:56:04 +01:00
|
|
|
OnlineWindow: time.Hour,
|
|
|
|
})
|
2019-02-11 17:10:32 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
} else {
|
2020-04-09 16:19:44 +01:00
|
|
|
nodes, err = cache.SelectStorageNodes(ctx, numNodesToSelect, numNodesToSelect, &overlay.NodeCriteria{
|
2019-04-26 13:15:06 +01:00
|
|
|
OnlineWindow: time.Hour,
|
2019-02-11 17:10:32 +00:00
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
}
|
2019-02-09 21:17:49 +00:00
|
|
|
require.Len(t, nodes, numNodesToSelect)
|
|
|
|
|
|
|
|
for _, node := range nodes {
|
2020-03-28 14:56:05 +00:00
|
|
|
nodeCounts[node.ID]++
|
2019-02-09 21:17:49 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-11 12:04:00 +00:00
|
|
|
belowThreshold := 0
|
|
|
|
|
|
|
|
table := []int{}
|
|
|
|
|
2019-02-09 21:17:49 +00:00
|
|
|
// expect that each node has been selected at least minSelectCount times
|
|
|
|
for _, id := range allIDs {
|
|
|
|
count := nodeCounts[id]
|
2019-02-11 12:04:00 +00:00
|
|
|
if count < minSelectCount {
|
|
|
|
belowThreshold++
|
|
|
|
}
|
|
|
|
if count >= len(table) {
|
|
|
|
table = append(table, make([]int, count-len(table)+1)...)
|
|
|
|
}
|
|
|
|
table[count]++
|
|
|
|
}
|
|
|
|
|
|
|
|
if belowThreshold > totalNodes*1/100 {
|
|
|
|
t.Errorf("%d out of %d were below threshold %d", belowThreshold, totalNodes, minSelectCount)
|
2020-04-24 20:34:53 +01:00
|
|
|
for count, amount := range table {
|
|
|
|
t.Logf("%3d = %4d", count, amount)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
func TestRandomizedSelectionCache(t *testing.T) {
|
|
|
|
t.Parallel()
|
|
|
|
|
|
|
|
totalNodes := 1000
|
|
|
|
selectIterations := 100
|
|
|
|
numNodesToSelect := 100
|
|
|
|
minSelectCount := 3
|
|
|
|
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 0, UplinkCount: 0,
|
|
|
|
Reconfigure: testplanet.Reconfigure{
|
|
|
|
Satellite: func(log *zap.Logger, index int, config *satellite.Config) {
|
|
|
|
config.Overlay.NodeSelectionCache.Staleness = -time.Hour
|
|
|
|
config.Overlay.Node.NewNodeFraction = 0.5 // select 50% new nodes
|
|
|
|
config.Overlay.Node.AuditCount = 1
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
satellite := planet.Satellites[0]
|
|
|
|
overlaydb := satellite.Overlay.DB
|
2021-01-28 11:46:18 +00:00
|
|
|
uploadSelectionCache := satellite.Overlay.Service.UploadSelectionCache
|
2020-04-24 20:34:53 +01:00
|
|
|
allIDs := make(storj.NodeIDList, totalNodes)
|
|
|
|
nodeCounts := make(map[storj.NodeID]int)
|
|
|
|
expectedNewCount := int(float64(totalNodes) * satellite.Config.Overlay.Node.NewNodeFraction)
|
|
|
|
|
|
|
|
// put nodes in cache
|
|
|
|
for i := 0; i < totalNodes; i++ {
|
|
|
|
newID := testrand.NodeID()
|
|
|
|
address := fmt.Sprintf("127.0.%d.0:8080", i)
|
|
|
|
lastNet := fmt.Sprintf("127.0.%d", i)
|
|
|
|
|
|
|
|
n := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: newID,
|
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: address,
|
|
|
|
Transport: pb.NodeTransport_TCP_TLS_GRPC,
|
|
|
|
},
|
|
|
|
LastNet: lastNet,
|
|
|
|
LastIPPort: address,
|
|
|
|
IsUp: true,
|
|
|
|
Capacity: &pb.NodeCapacity{
|
2020-07-08 15:28:49 +01:00
|
|
|
FreeDisk: 200 * memory.MiB.Int64(),
|
2020-04-24 20:34:53 +01:00
|
|
|
},
|
|
|
|
Version: &pb.NodeVersion{
|
|
|
|
Version: "v1.1.0",
|
|
|
|
CommitHash: "",
|
|
|
|
Timestamp: time.Time{},
|
|
|
|
Release: true,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
defaults := overlay.NodeSelectionConfig{}
|
|
|
|
err := overlaydb.UpdateCheckIn(ctx, n, time.Now().UTC(), defaults)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
if i%2 == 0 { // make half of nodes "new" and half "vetted"
|
|
|
|
_, err = overlaydb.UpdateStats(ctx, &overlay.UpdateRequest{
|
|
|
|
NodeID: newID,
|
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
|
|
|
AuditLambda: 1,
|
|
|
|
AuditWeight: 1,
|
|
|
|
AuditDQ: 0.5,
|
2020-08-26 21:26:10 +01:00
|
|
|
AuditHistory: testAuditHistoryConfig(),
|
|
|
|
}, time.Now())
|
2020-04-24 20:34:53 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
allIDs[i] = newID
|
|
|
|
nodeCounts[newID] = 0
|
|
|
|
}
|
|
|
|
|
2021-01-28 11:46:18 +00:00
|
|
|
err := uploadSelectionCache.Refresh(ctx)
|
2020-04-24 20:34:53 +01:00
|
|
|
require.NoError(t, err)
|
2021-01-28 11:46:18 +00:00
|
|
|
reputable, new := uploadSelectionCache.Size()
|
2020-04-24 20:34:53 +01:00
|
|
|
require.Equal(t, totalNodes-expectedNewCount, reputable)
|
|
|
|
require.Equal(t, expectedNewCount, new)
|
|
|
|
|
|
|
|
// select numNodesToSelect nodes selectIterations times
|
|
|
|
for i := 0; i < selectIterations; i++ {
|
|
|
|
var nodes []*overlay.SelectedNode
|
|
|
|
var err error
|
|
|
|
req := overlay.FindStorageNodesRequest{
|
|
|
|
RequestedCount: numNodesToSelect,
|
|
|
|
}
|
|
|
|
|
2021-01-28 11:46:18 +00:00
|
|
|
nodes, err = uploadSelectionCache.GetNodes(ctx, req)
|
2020-04-24 20:34:53 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, nodes, numNodesToSelect)
|
|
|
|
|
|
|
|
for _, node := range nodes {
|
|
|
|
nodeCounts[node.ID]++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
belowThreshold := 0
|
|
|
|
|
|
|
|
table := []int{}
|
|
|
|
|
|
|
|
// expect that each node has been selected at least minSelectCount times
|
|
|
|
for _, id := range allIDs {
|
|
|
|
count := nodeCounts[id]
|
|
|
|
if count < minSelectCount {
|
|
|
|
belowThreshold++
|
|
|
|
}
|
|
|
|
if count >= len(table) {
|
|
|
|
table = append(table, make([]int, count-len(table)+1)...)
|
|
|
|
}
|
|
|
|
table[count]++
|
|
|
|
}
|
|
|
|
|
|
|
|
if belowThreshold > totalNodes*1/100 {
|
|
|
|
t.Errorf("%d out of %d were below threshold %d", belowThreshold, totalNodes, minSelectCount)
|
2019-02-11 12:04:00 +00:00
|
|
|
for count, amount := range table {
|
|
|
|
t.Logf("%3d = %4d", count, amount)
|
|
|
|
}
|
2019-02-09 21:17:49 +00:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
2019-05-30 20:52:33 +01:00
|
|
|
|
2019-06-11 14:30:28 +01:00
|
|
|
func TestNodeInfo(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 0,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
planet.StorageNodes[0].Storage2.Monitor.Loop.Pause()
|
|
|
|
|
|
|
|
node, err := planet.Satellites[0].Overlay.Service.Get(ctx, planet.StorageNodes[0].ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-05-19 17:21:44 +01:00
|
|
|
dossier := planet.StorageNodes[0].Contact.Service.Local()
|
|
|
|
|
2019-06-11 14:30:28 +01:00
|
|
|
assert.Equal(t, pb.NodeType_STORAGE, node.Type)
|
|
|
|
assert.NotEmpty(t, node.Operator.Email)
|
|
|
|
assert.NotEmpty(t, node.Operator.Wallet)
|
2020-05-19 17:21:44 +01:00
|
|
|
assert.Equal(t, dossier.Operator, node.Operator)
|
2019-06-11 14:30:28 +01:00
|
|
|
assert.NotEmpty(t, node.Capacity.FreeDisk)
|
2020-05-19 17:21:44 +01:00
|
|
|
assert.Equal(t, dossier.Capacity, node.Capacity)
|
2019-06-11 14:30:28 +01:00
|
|
|
assert.NotEmpty(t, node.Version.Version)
|
2020-05-19 17:21:44 +01:00
|
|
|
assert.Equal(t, dossier.Version.Version, node.Version.Version)
|
2019-06-11 14:30:28 +01:00
|
|
|
})
|
|
|
|
}
|
2019-09-19 19:37:31 +01:00
|
|
|
|
2020-03-30 14:32:02 +01:00
|
|
|
func TestGetOnlineNodesForGetDelete(t *testing.T) {
|
2020-03-13 18:01:48 +00:00
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 2, UplinkCount: 0,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
// pause chores that might update node data
|
|
|
|
planet.Satellites[0].Audit.Chore.Loop.Pause()
|
|
|
|
planet.Satellites[0].Repair.Checker.Loop.Pause()
|
|
|
|
planet.Satellites[0].Repair.Repairer.Loop.Pause()
|
|
|
|
for _, node := range planet.StorageNodes {
|
|
|
|
node.Contact.Chore.Pause(ctx)
|
|
|
|
}
|
|
|
|
|
|
|
|
// should not return anything if nodeIDs aren't in the nodes table
|
2020-03-30 14:32:02 +01:00
|
|
|
actualNodes, err := planet.Satellites[0].Overlay.Service.GetOnlineNodesForGetDelete(ctx, []storj.NodeID{})
|
2020-03-13 18:01:48 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, 0, len(actualNodes))
|
2020-03-30 14:32:02 +01:00
|
|
|
actualNodes, err = planet.Satellites[0].Overlay.Service.GetOnlineNodesForGetDelete(ctx, []storj.NodeID{testrand.NodeID()})
|
2020-03-13 18:01:48 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, 0, len(actualNodes))
|
|
|
|
|
2020-03-30 14:32:02 +01:00
|
|
|
expectedNodes := make(map[storj.NodeID]*overlay.SelectedNode, len(planet.StorageNodes))
|
2020-03-13 18:01:48 +00:00
|
|
|
nodeIDs := make([]storj.NodeID, len(planet.StorageNodes)+1)
|
|
|
|
for i, node := range planet.StorageNodes {
|
|
|
|
nodeIDs[i] = node.ID()
|
2020-03-30 14:32:02 +01:00
|
|
|
dossier, err := planet.Satellites[0].Overlay.Service.Get(ctx, node.ID())
|
2020-03-13 18:01:48 +00:00
|
|
|
require.NoError(t, err)
|
2020-03-30 14:32:02 +01:00
|
|
|
expectedNodes[dossier.Id] = &overlay.SelectedNode{
|
|
|
|
ID: dossier.Id,
|
|
|
|
Address: dossier.Address,
|
|
|
|
LastNet: dossier.LastNet,
|
|
|
|
LastIPPort: dossier.LastIPPort,
|
|
|
|
}
|
2020-03-13 18:01:48 +00:00
|
|
|
}
|
2020-03-30 14:32:02 +01:00
|
|
|
// add a fake node ID to make sure GetOnlineNodesForGetDelete doesn't error and still returns the expected nodes.
|
2020-03-13 18:01:48 +00:00
|
|
|
nodeIDs[len(planet.StorageNodes)] = testrand.NodeID()
|
|
|
|
|
2020-03-30 14:32:02 +01:00
|
|
|
actualNodes, err = planet.Satellites[0].Overlay.Service.GetOnlineNodesForGetDelete(ctx, nodeIDs)
|
2020-03-13 18:01:48 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
require.True(t, reflect.DeepEqual(expectedNodes, actualNodes))
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2019-12-16 13:45:13 +00:00
|
|
|
func TestKnownReliable(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
2021-03-18 19:55:06 +00:00
|
|
|
SatelliteCount: 1, StorageNodeCount: 6, UplinkCount: 1,
|
|
|
|
Reconfigure: testplanet.Reconfigure{
|
|
|
|
Satellite: func(log *zap.Logger, index int, config *satellite.Config) {
|
|
|
|
config.Overlay.AuditHistory = overlay.AuditHistoryConfig{
|
|
|
|
WindowSize: time.Hour,
|
|
|
|
TrackingPeriod: 2 * time.Hour,
|
|
|
|
GracePeriod: time.Hour,
|
|
|
|
OfflineThreshold: 0.6,
|
|
|
|
OfflineDQEnabled: false,
|
|
|
|
OfflineSuspensionEnabled: true,
|
|
|
|
}
|
|
|
|
},
|
|
|
|
},
|
2019-12-16 13:45:13 +00:00
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
satellite := planet.Satellites[0]
|
|
|
|
service := satellite.Overlay.Service
|
|
|
|
|
|
|
|
// Disqualify storage node #0
|
2020-03-11 21:11:46 +00:00
|
|
|
err := satellite.DB.OverlayCache().DisqualifyNode(ctx, planet.StorageNodes[0].ID())
|
2019-12-16 13:45:13 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
// Stop storage node #1
|
2020-03-11 21:11:46 +00:00
|
|
|
offlineNode := planet.StorageNodes[1]
|
|
|
|
err = planet.StopPeer(offlineNode)
|
2019-12-16 13:45:13 +00:00
|
|
|
require.NoError(t, err)
|
2020-03-11 21:11:46 +00:00
|
|
|
// set last contact success to 1 hour ago to make node appear offline
|
|
|
|
checkInInfo := getNodeInfo(offlineNode.ID())
|
|
|
|
err = service.UpdateCheckIn(ctx, checkInInfo, time.Now().Add(-time.Hour))
|
2019-12-16 13:45:13 +00:00
|
|
|
require.NoError(t, err)
|
2020-03-11 21:11:46 +00:00
|
|
|
// Check that storage node #1 is offline
|
|
|
|
node, err := service.Get(ctx, offlineNode.ID())
|
2019-12-16 13:45:13 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.False(t, service.IsOnline(node))
|
|
|
|
|
2021-03-18 19:55:06 +00:00
|
|
|
// unknown audit suspend storage node #2
|
2020-06-10 17:11:25 +01:00
|
|
|
err = satellite.DB.OverlayCache().SuspendNodeUnknownAudit(ctx, planet.StorageNodes[2].ID(), time.Now())
|
2020-03-11 21:11:46 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
2021-03-18 19:55:06 +00:00
|
|
|
// offline suspend storage node #3
|
|
|
|
require.NoError(t, offlineSuspendNode(ctx, satellite.Overlay.DB, &planet.Satellites[0].Config.Overlay.AuditHistory, planet.StorageNodes[3].ID()))
|
|
|
|
|
|
|
|
// Check that only storage nodes #4 and #5 are reliable
|
2019-12-16 13:45:13 +00:00
|
|
|
result, err := service.KnownReliable(ctx, []storj.NodeID{
|
|
|
|
planet.StorageNodes[0].ID(),
|
|
|
|
planet.StorageNodes[1].ID(),
|
|
|
|
planet.StorageNodes[2].ID(),
|
|
|
|
planet.StorageNodes[3].ID(),
|
2020-03-11 21:11:46 +00:00
|
|
|
planet.StorageNodes[4].ID(),
|
2021-03-18 19:55:06 +00:00
|
|
|
planet.StorageNodes[5].ID(),
|
2019-12-16 13:45:13 +00:00
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
2020-12-31 17:00:43 +00:00
|
|
|
require.Len(t, result, 2)
|
2019-12-16 13:45:13 +00:00
|
|
|
|
|
|
|
// Sort the storage nodes for predictable checks
|
2020-05-19 17:21:44 +01:00
|
|
|
expectedReliable := []storj.NodeURL{
|
|
|
|
planet.StorageNodes[4].NodeURL(),
|
2021-03-18 19:55:06 +00:00
|
|
|
planet.StorageNodes[5].NodeURL(),
|
2020-05-19 17:21:44 +01:00
|
|
|
}
|
|
|
|
sort.Slice(expectedReliable, func(i, j int) bool { return expectedReliable[i].ID.Less(expectedReliable[j].ID) })
|
2019-12-16 13:45:13 +00:00
|
|
|
sort.Slice(result, func(i, j int) bool { return result[i].Id.Less(result[j].Id) })
|
|
|
|
|
|
|
|
// Assert the reliable nodes are the expected ones
|
|
|
|
for i, node := range result {
|
2020-05-19 17:21:44 +01:00
|
|
|
assert.Equal(t, expectedReliable[i].ID, node.Id)
|
|
|
|
assert.Equal(t, expectedReliable[i].Address, node.Address.Address)
|
2019-12-16 13:45:13 +00:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2019-09-19 19:37:31 +01:00
|
|
|
func TestUpdateCheckIn(t *testing.T) {
|
2020-01-19 16:29:15 +00:00
|
|
|
satellitedbtest.Run(t, func(ctx *testcontext.Context, t *testing.T, db satellite.DB) { // setup
|
2019-09-19 19:37:31 +01:00
|
|
|
nodeID := storj.NodeID{1, 2, 3}
|
|
|
|
expectedEmail := "test@email.com"
|
2020-03-06 22:04:23 +00:00
|
|
|
expectedAddress := "1.2.4.4:8080"
|
2019-09-19 19:37:31 +01:00
|
|
|
info := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: nodeID,
|
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: expectedAddress,
|
|
|
|
},
|
|
|
|
IsUp: true,
|
|
|
|
Capacity: &pb.NodeCapacity{
|
2020-02-12 21:19:42 +00:00
|
|
|
FreeDisk: int64(5678),
|
2019-09-19 19:37:31 +01:00
|
|
|
},
|
|
|
|
Operator: &pb.NodeOperator{
|
2021-01-18 14:33:13 +00:00
|
|
|
Email: expectedEmail,
|
|
|
|
Wallet: "0x123",
|
|
|
|
WalletFeatures: []string{"example"},
|
2019-09-19 19:37:31 +01:00
|
|
|
},
|
|
|
|
Version: &pb.NodeVersion{
|
|
|
|
Version: "v0.0.0",
|
|
|
|
CommitHash: "",
|
|
|
|
Timestamp: time.Time{},
|
|
|
|
Release: false,
|
|
|
|
},
|
2020-03-06 22:04:23 +00:00
|
|
|
LastIPPort: expectedAddress,
|
|
|
|
LastNet: "1.2.4",
|
2019-09-19 19:37:31 +01:00
|
|
|
}
|
|
|
|
expectedNode := &overlay.NodeDossier{
|
|
|
|
Node: pb.Node{
|
2020-03-06 22:04:23 +00:00
|
|
|
Id: nodeID,
|
2019-09-19 19:37:31 +01:00
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: info.Address.GetAddress(),
|
|
|
|
Transport: pb.NodeTransport_TCP_TLS_GRPC,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Type: pb.NodeType_STORAGE,
|
|
|
|
Operator: pb.NodeOperator{
|
2021-01-18 14:33:13 +00:00
|
|
|
Email: info.Operator.GetEmail(),
|
|
|
|
Wallet: info.Operator.GetWallet(),
|
|
|
|
WalletFeatures: info.Operator.GetWalletFeatures(),
|
2019-09-19 19:37:31 +01:00
|
|
|
},
|
|
|
|
Capacity: pb.NodeCapacity{
|
2020-02-12 21:19:42 +00:00
|
|
|
FreeDisk: info.Capacity.GetFreeDisk(),
|
2019-09-19 19:37:31 +01:00
|
|
|
},
|
|
|
|
Version: pb.NodeVersion{
|
|
|
|
Version: "v0.0.0",
|
|
|
|
CommitHash: "",
|
|
|
|
Timestamp: time.Time{},
|
|
|
|
Release: false,
|
|
|
|
},
|
|
|
|
Contained: false,
|
|
|
|
Disqualified: nil,
|
|
|
|
PieceCount: 0,
|
2019-10-11 22:18:05 +01:00
|
|
|
ExitStatus: overlay.ExitStatus{NodeID: nodeID},
|
2020-03-06 22:04:23 +00:00
|
|
|
LastIPPort: expectedAddress,
|
|
|
|
LastNet: "1.2.4",
|
2019-09-19 19:37:31 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
// confirm the node doesn't exist in nodes table yet
|
|
|
|
_, err := db.OverlayCache().Get(ctx, nodeID)
|
|
|
|
require.Error(t, err)
|
|
|
|
require.Contains(t, err.Error(), "node not found")
|
|
|
|
|
|
|
|
// check-in for that node id, which should add the node
|
|
|
|
// to the nodes tables in the database
|
2020-03-10 22:05:01 +00:00
|
|
|
startOfTest := time.Now()
|
2020-04-29 17:29:19 +01:00
|
|
|
err = db.OverlayCache().UpdateCheckIn(ctx, info, startOfTest.Add(time.Second), overlay.NodeSelectionConfig{})
|
2019-09-19 19:37:31 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
// confirm that the node is now in the nodes table with the
|
|
|
|
// correct fields set
|
|
|
|
actualNode, err := db.OverlayCache().Get(ctx, nodeID)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.True(t, actualNode.Reputation.LastContactSuccess.After(startOfTest))
|
2019-11-15 22:43:06 +00:00
|
|
|
require.True(t, actualNode.Reputation.LastContactFailure.UTC().Equal(time.Time{}.UTC()))
|
2020-04-13 22:38:33 +01:00
|
|
|
actualNode.Address = expectedNode.Address
|
2019-09-19 19:37:31 +01:00
|
|
|
|
|
|
|
// we need to overwrite the times so that the deep equal considers them the same
|
|
|
|
expectedNode.Reputation.LastContactSuccess = actualNode.Reputation.LastContactSuccess
|
|
|
|
expectedNode.Reputation.LastContactFailure = actualNode.Reputation.LastContactFailure
|
2020-04-13 22:38:33 +01:00
|
|
|
expectedNode.Reputation.AuditReputationAlpha = 1
|
|
|
|
expectedNode.Reputation.UnknownAuditReputationAlpha = 1
|
|
|
|
expectedNode.Reputation.AuditReputationBeta = 0
|
|
|
|
expectedNode.Reputation.UnknownAuditReputationBeta = 0
|
2020-08-28 20:43:53 +01:00
|
|
|
expectedNode.Reputation.OnlineScore = 1
|
2019-09-19 19:37:31 +01:00
|
|
|
expectedNode.Version.Timestamp = actualNode.Version.Timestamp
|
2019-10-23 02:06:01 +01:00
|
|
|
expectedNode.CreatedAt = actualNode.CreatedAt
|
2019-10-11 22:18:05 +01:00
|
|
|
require.Equal(t, expectedNode, actualNode)
|
2019-09-19 19:37:31 +01:00
|
|
|
|
|
|
|
// confirm that we can update the address field
|
2020-03-10 22:05:01 +00:00
|
|
|
startOfUpdateTest := time.Now()
|
2019-09-19 19:37:31 +01:00
|
|
|
expectedAddress = "9.8.7.6"
|
|
|
|
updatedInfo := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: nodeID,
|
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: expectedAddress,
|
|
|
|
},
|
|
|
|
IsUp: true,
|
|
|
|
Version: &pb.NodeVersion{
|
2019-09-26 01:07:39 +01:00
|
|
|
Version: "v0.1.0",
|
|
|
|
CommitHash: "abc123",
|
2020-03-10 22:05:01 +00:00
|
|
|
Timestamp: time.Now(),
|
2019-09-26 01:07:39 +01:00
|
|
|
Release: true,
|
2019-09-19 19:37:31 +01:00
|
|
|
},
|
2020-03-06 22:04:23 +00:00
|
|
|
LastIPPort: expectedAddress,
|
|
|
|
LastNet: "9.8.7",
|
2019-09-19 19:37:31 +01:00
|
|
|
}
|
|
|
|
// confirm that the updated node is in the nodes table with the
|
|
|
|
// correct updated fields set
|
2020-04-29 17:29:19 +01:00
|
|
|
err = db.OverlayCache().UpdateCheckIn(ctx, updatedInfo, startOfUpdateTest.Add(time.Second), overlay.NodeSelectionConfig{})
|
2019-09-19 19:37:31 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
updatedNode, err := db.OverlayCache().Get(ctx, nodeID)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.True(t, updatedNode.Reputation.LastContactSuccess.After(startOfUpdateTest))
|
2020-03-10 22:05:01 +00:00
|
|
|
require.True(t, updatedNode.Reputation.LastContactFailure.Equal(time.Time{}))
|
2019-09-19 19:37:31 +01:00
|
|
|
require.Equal(t, updatedNode.Address.GetAddress(), expectedAddress)
|
2019-09-26 01:07:39 +01:00
|
|
|
require.Equal(t, updatedInfo.Version.GetVersion(), updatedNode.Version.GetVersion())
|
|
|
|
require.Equal(t, updatedInfo.Version.GetCommitHash(), updatedNode.Version.GetCommitHash())
|
|
|
|
require.Equal(t, updatedInfo.Version.GetRelease(), updatedNode.Version.GetRelease())
|
|
|
|
require.True(t, updatedNode.Version.GetTimestamp().After(info.Version.GetTimestamp()))
|
2019-09-19 19:37:31 +01:00
|
|
|
|
2020-03-10 22:05:01 +00:00
|
|
|
// confirm we can udpate IsUp field
|
|
|
|
startOfUpdateTest2 := time.Now()
|
2019-09-19 19:37:31 +01:00
|
|
|
updatedInfo2 := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: nodeID,
|
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: "9.8.7.6",
|
|
|
|
},
|
|
|
|
IsUp: false,
|
|
|
|
Version: &pb.NodeVersion{
|
|
|
|
Version: "v0.0.0",
|
|
|
|
CommitHash: "",
|
|
|
|
Timestamp: time.Time{},
|
|
|
|
Release: false,
|
|
|
|
},
|
|
|
|
}
|
2020-04-29 17:29:19 +01:00
|
|
|
|
|
|
|
err = db.OverlayCache().UpdateCheckIn(ctx, updatedInfo2, startOfUpdateTest2.Add(time.Second), overlay.NodeSelectionConfig{})
|
2019-09-19 19:37:31 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
updated2Node, err := db.OverlayCache().Get(ctx, nodeID)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.True(t, updated2Node.Reputation.LastContactSuccess.Equal(updatedNode.Reputation.LastContactSuccess))
|
|
|
|
require.True(t, updated2Node.Reputation.LastContactFailure.After(startOfUpdateTest2))
|
|
|
|
})
|
|
|
|
}
|
2019-12-30 17:10:24 +00:00
|
|
|
|
2020-07-16 15:18:02 +01:00
|
|
|
// TestSuspendedSelection ensures that suspended nodes are not selected by SelectStorageNodes.
|
2020-03-11 21:11:46 +00:00
|
|
|
func TestSuspendedSelection(t *testing.T) {
|
|
|
|
totalNodes := 10
|
|
|
|
|
|
|
|
satellitedbtest.Run(t, func(ctx *testcontext.Context, t *testing.T, db satellite.DB) {
|
|
|
|
cache := db.OverlayCache()
|
|
|
|
suspendedIDs := make(map[storj.NodeID]bool)
|
2020-07-08 15:28:49 +01:00
|
|
|
config := overlay.NodeSelectionConfig{AuditCount: 1}
|
2020-03-11 21:11:46 +00:00
|
|
|
|
|
|
|
// put nodes in cache
|
|
|
|
for i := 0; i < totalNodes; i++ {
|
|
|
|
newID := testrand.NodeID()
|
2020-04-29 18:58:41 +01:00
|
|
|
addr := fmt.Sprintf("127.0.%d.0:8080", i)
|
|
|
|
lastNet := fmt.Sprintf("127.0.%d", i)
|
|
|
|
d := overlay.NodeCheckInInfo{
|
|
|
|
NodeID: newID,
|
|
|
|
Address: &pb.NodeAddress{Address: addr, Transport: pb.NodeTransport_TCP_TLS_GRPC},
|
|
|
|
LastIPPort: addr,
|
|
|
|
LastNet: lastNet,
|
|
|
|
Version: &pb.NodeVersion{Version: "v1.0.0"},
|
|
|
|
Capacity: &pb.NodeCapacity{},
|
|
|
|
IsUp: true,
|
|
|
|
}
|
2020-07-08 15:28:49 +01:00
|
|
|
err := cache.UpdateCheckIn(ctx, d, time.Now().UTC(), config)
|
2020-03-11 21:11:46 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
if i%2 == 0 { // make half of nodes "new" and half "vetted"
|
|
|
|
_, err = cache.UpdateStats(ctx, &overlay.UpdateRequest{
|
|
|
|
NodeID: newID,
|
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
|
|
|
AuditLambda: 1,
|
|
|
|
AuditWeight: 1,
|
|
|
|
AuditDQ: 0.5,
|
2020-08-26 21:26:10 +01:00
|
|
|
AuditHistory: testAuditHistoryConfig(),
|
|
|
|
}, time.Now().UTC())
|
2020-03-11 21:11:46 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
}
|
|
|
|
|
2021-03-18 19:55:06 +00:00
|
|
|
ahConfig := &overlay.AuditHistoryConfig{
|
|
|
|
WindowSize: time.Hour,
|
|
|
|
TrackingPeriod: 2 * time.Hour,
|
|
|
|
GracePeriod: time.Hour,
|
|
|
|
OfflineThreshold: 0.6,
|
|
|
|
OfflineDQEnabled: false,
|
|
|
|
OfflineSuspensionEnabled: true,
|
|
|
|
}
|
|
|
|
|
2020-03-11 21:11:46 +00:00
|
|
|
// suspend the first four nodes (2 new, 2 vetted)
|
2021-03-18 19:55:06 +00:00
|
|
|
// 2 offline suspended and 2 unknown audit suspended
|
2020-03-11 21:11:46 +00:00
|
|
|
if i < 4 {
|
2021-03-18 19:55:06 +00:00
|
|
|
if i < 2 {
|
|
|
|
require.NoError(t, offlineSuspendNode(ctx, cache, ahConfig, newID))
|
|
|
|
continue
|
|
|
|
}
|
2020-06-10 17:11:25 +01:00
|
|
|
err = cache.SuspendNodeUnknownAudit(ctx, newID, time.Now())
|
2020-03-11 21:11:46 +00:00
|
|
|
require.NoError(t, err)
|
|
|
|
suspendedIDs[newID] = true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-03-28 14:56:05 +00:00
|
|
|
var nodes []*overlay.SelectedNode
|
2020-03-11 21:11:46 +00:00
|
|
|
var err error
|
|
|
|
|
|
|
|
numNodesToSelect := 10
|
|
|
|
|
|
|
|
// select 10 vetted nodes - 5 vetted, 2 suspended, so expect 3
|
2020-04-09 16:19:44 +01:00
|
|
|
nodes, err = cache.SelectStorageNodes(ctx, numNodesToSelect, 0, &overlay.NodeCriteria{
|
2020-03-11 21:11:46 +00:00
|
|
|
OnlineWindow: time.Hour,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, nodes, 3)
|
|
|
|
for _, node := range nodes {
|
2020-03-28 14:56:05 +00:00
|
|
|
require.False(t, suspendedIDs[node.ID])
|
2020-03-11 21:11:46 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// select 10 new nodes - 5 new, 2 suspended, so expect 3
|
2020-04-09 16:19:44 +01:00
|
|
|
nodes, err = cache.SelectStorageNodes(ctx, numNodesToSelect, numNodesToSelect, &overlay.NodeCriteria{
|
2020-03-11 21:11:46 +00:00
|
|
|
OnlineWindow: time.Hour,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, nodes, 3)
|
|
|
|
for _, node := range nodes {
|
2020-03-28 14:56:05 +00:00
|
|
|
require.False(t, suspendedIDs[node.ID])
|
2020-03-11 21:11:46 +00:00
|
|
|
}
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-06-08 16:27:08 +01:00
|
|
|
func TestConcurrentAudit(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 1,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
planet.Satellites[0].Audit.Chore.Loop.Stop()
|
|
|
|
data := testrand.Bytes(10 * memory.MB)
|
|
|
|
err := planet.Uplinks[0].Upload(ctx, planet.Satellites[0], "bucket", "testpath", data)
|
|
|
|
require.NoError(t, err)
|
|
|
|
var group errgroup.Group
|
|
|
|
n := 5
|
|
|
|
for i := 0; i < n; i++ {
|
|
|
|
group.Go(func() error {
|
|
|
|
_, err := planet.Satellites[0].Overlay.Service.UpdateStats(ctx, &overlay.UpdateRequest{
|
|
|
|
NodeID: planet.StorageNodes[0].ID(),
|
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
|
|
|
})
|
|
|
|
return err
|
|
|
|
})
|
|
|
|
}
|
|
|
|
err = group.Wait()
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
node, err := planet.Satellites[0].DB.OverlayCache().Get(ctx, planet.StorageNodes[0].ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, int64(n), node.Reputation.AuditCount)
|
|
|
|
|
|
|
|
for i := 0; i < n; i++ {
|
|
|
|
group.Go(func() error {
|
|
|
|
_, err := planet.Satellites[0].Overlay.Service.BatchUpdateStats(ctx, []*overlay.UpdateRequest{
|
|
|
|
{
|
|
|
|
NodeID: planet.StorageNodes[0].ID(),
|
|
|
|
AuditOutcome: overlay.AuditSuccess,
|
|
|
|
},
|
|
|
|
})
|
|
|
|
return err
|
|
|
|
})
|
|
|
|
}
|
|
|
|
err = group.Wait()
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
node, err = planet.Satellites[0].DB.OverlayCache().Get(ctx, planet.StorageNodes[0].ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, int64(n*2), node.Reputation.AuditCount)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-01-02 20:41:18 +00:00
|
|
|
func getNodeInfo(nodeID storj.NodeID) overlay.NodeCheckInInfo {
|
|
|
|
return overlay.NodeCheckInInfo{
|
|
|
|
NodeID: nodeID,
|
|
|
|
IsUp: true,
|
|
|
|
Address: &pb.NodeAddress{
|
|
|
|
Address: "1.2.3.4",
|
|
|
|
},
|
|
|
|
Operator: &pb.NodeOperator{
|
|
|
|
Email: "test@email.com",
|
|
|
|
Wallet: "0x123",
|
|
|
|
},
|
|
|
|
Version: &pb.NodeVersion{
|
|
|
|
Version: "v0.0.0",
|
|
|
|
CommitHash: "",
|
|
|
|
Timestamp: time.Time{},
|
|
|
|
Release: false,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
}
|
2020-07-08 15:28:49 +01:00
|
|
|
|
2021-06-17 15:01:21 +01:00
|
|
|
func TestUpdateReputation(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 0,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
service := planet.Satellites[0].Overlay.Service
|
2021-06-23 00:09:39 +01:00
|
|
|
overlaydb := planet.Satellites[0].Overlay.DB
|
2021-06-17 15:01:21 +01:00
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
|
|
|
|
info, err := service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.False(t, info.Contained)
|
|
|
|
require.Nil(t, info.Disqualified)
|
|
|
|
require.Nil(t, info.UnknownAuditSuspended)
|
|
|
|
require.Nil(t, info.OfflineSuspended)
|
|
|
|
require.Nil(t, info.Reputation.VettedAt)
|
|
|
|
|
|
|
|
t0 := time.Now().Truncate(time.Hour)
|
|
|
|
t1 := t0.Add(time.Hour)
|
|
|
|
t2 := t0.Add(2 * time.Hour)
|
|
|
|
t3 := t0.Add(3 * time.Hour)
|
|
|
|
|
|
|
|
reputationChange := &overlay.ReputationStatus{
|
|
|
|
Contained: true,
|
|
|
|
Disqualified: &t0,
|
|
|
|
UnknownAuditSuspended: &t1,
|
|
|
|
OfflineSuspended: &t2,
|
|
|
|
VettedAt: &t3,
|
|
|
|
}
|
|
|
|
err = service.UpdateReputation(ctx, node.ID(), reputationChange)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
info, err = service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.True(t, info.Contained)
|
|
|
|
require.Equal(t, reputationChange.Disqualified, info.Disqualified)
|
|
|
|
require.Equal(t, reputationChange.UnknownAuditSuspended, info.UnknownAuditSuspended)
|
|
|
|
require.Equal(t, reputationChange.OfflineSuspended, info.OfflineSuspended)
|
|
|
|
require.Equal(t, reputationChange.VettedAt, info.Reputation.VettedAt)
|
|
|
|
|
|
|
|
reputationChange.Contained = false
|
|
|
|
reputationChange.Disqualified = nil
|
|
|
|
|
|
|
|
err = service.UpdateReputation(ctx, node.ID(), reputationChange)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
info, err = service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.False(t, info.Contained)
|
|
|
|
require.Equal(t, reputationChange.Disqualified, info.Disqualified)
|
2021-06-23 00:09:39 +01:00
|
|
|
|
|
|
|
nodeInfo, err := overlaydb.UpdateExitStatus(ctx, &overlay.ExitStatusRequest{
|
|
|
|
NodeID: node.ID(),
|
|
|
|
ExitInitiatedAt: t0,
|
|
|
|
ExitLoopCompletedAt: t1,
|
|
|
|
ExitFinishedAt: t1,
|
|
|
|
ExitSuccess: true,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.NotNil(t, nodeInfo.ExitStatus.ExitFinishedAt)
|
|
|
|
|
|
|
|
// make sure Disqualified field is not updated if a node has finished
|
|
|
|
// graceful exit
|
|
|
|
reputationChange.Disqualified = &t0
|
|
|
|
err = service.UpdateReputation(ctx, node.ID(), reputationChange)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
exitedNodeInfo, err := service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Equal(t, info.Disqualified, exitedNodeInfo.Disqualified)
|
2021-06-17 15:01:21 +01:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
2020-07-08 15:28:49 +01:00
|
|
|
func TestVetAndUnvetNode(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 2, UplinkCount: 0,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
service := planet.Satellites[0].Overlay.Service
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
|
|
|
|
// clear existing data
|
|
|
|
err := service.TestUnvetNode(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
dossier, err := service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Nil(t, dossier.Reputation.VettedAt)
|
|
|
|
|
|
|
|
// vet again
|
|
|
|
vettedTime, err := service.TestVetNode(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.NotNil(t, vettedTime)
|
|
|
|
dossier, err = service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.NotNil(t, dossier.Reputation.VettedAt)
|
|
|
|
|
|
|
|
// unvet again
|
|
|
|
err = service.TestUnvetNode(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
dossier, err = service.Get(ctx, node.ID())
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Nil(t, dossier.Reputation.VettedAt)
|
|
|
|
})
|
|
|
|
}
|
2021-03-18 19:55:06 +00:00
|
|
|
|
|
|
|
func offlineSuspendNode(ctx context.Context, oc overlay.DB, config *overlay.AuditHistoryConfig, nodeID storj.NodeID) error {
|
|
|
|
updateReq := &overlay.UpdateRequest{
|
|
|
|
NodeID: nodeID,
|
|
|
|
AuditOutcome: overlay.AuditOffline,
|
|
|
|
AuditHistory: *config,
|
|
|
|
|
|
|
|
AuditLambda: 0.95,
|
|
|
|
AuditWeight: 1,
|
|
|
|
AuditDQ: 0.6,
|
|
|
|
SuspensionGracePeriod: time.Hour,
|
|
|
|
SuspensionDQEnabled: true,
|
|
|
|
AuditsRequiredForVetting: 0,
|
|
|
|
}
|
|
|
|
windowTime := time.Now()
|
|
|
|
for i := 0; i <= int(config.TrackingPeriod/config.WindowSize); i++ {
|
|
|
|
_, err := oc.UpdateStats(ctx, updateReq, windowTime)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
windowTime = windowTime.Add(time.Hour)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|