2019-08-22 15:33:14 +01:00
|
|
|
// Copyright (C) 2019 Storj Labs, Inc.
|
|
|
|
// See LICENSE for copying information.
|
|
|
|
|
|
|
|
package orders_test
|
|
|
|
|
|
|
|
import (
|
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/stretchr/testify/require"
|
|
|
|
|
2020-07-01 23:05:01 +01:00
|
|
|
"storj.io/common/memory"
|
2019-12-27 11:48:47 +00:00
|
|
|
"storj.io/common/pb"
|
2020-07-01 23:05:01 +01:00
|
|
|
"storj.io/common/signing"
|
2019-12-27 11:48:47 +00:00
|
|
|
"storj.io/common/testcontext"
|
|
|
|
"storj.io/common/testrand"
|
2019-11-14 19:46:15 +00:00
|
|
|
"storj.io/storj/private/testplanet"
|
2021-04-21 13:42:57 +01:00
|
|
|
"storj.io/storj/satellite/metabase"
|
2023-07-07 09:31:58 +01:00
|
|
|
"storj.io/storj/satellite/nodeselection"
|
2019-08-22 15:33:14 +01:00
|
|
|
"storj.io/storj/storagenode"
|
|
|
|
"storj.io/storj/storagenode/orders"
|
2020-10-01 23:52:22 +01:00
|
|
|
"storj.io/storj/storagenode/orders/ordersfile"
|
2019-08-22 15:33:14 +01:00
|
|
|
)
|
|
|
|
|
2020-07-01 23:05:01 +01:00
|
|
|
// TODO remove when db is removed.
|
|
|
|
func TestOrderDBSettle(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 1,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
satellite := planet.Satellites[0]
|
|
|
|
satellite.Audit.Worker.Loop.Pause()
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
service := node.Storage2.Orders
|
|
|
|
service.Sender.Pause()
|
|
|
|
service.Cleanup.Pause()
|
|
|
|
|
2020-11-18 21:39:13 +00:00
|
|
|
bucketname := "testbucket"
|
|
|
|
err := planet.Uplinks[0].CreateBucket(ctx, satellite, bucketname)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-07-01 23:05:01 +01:00
|
|
|
_, orderLimits, piecePrivateKey, err := satellite.Orders.Service.CreatePutOrderLimits(
|
|
|
|
ctx,
|
2020-11-18 21:39:13 +00:00
|
|
|
metabase.BucketLocation{ProjectID: planet.Uplinks[0].Projects[0].ID, BucketName: bucketname},
|
2023-07-07 09:31:58 +01:00
|
|
|
[]*nodeselection.SelectedNode{
|
2020-07-01 23:05:01 +01:00
|
|
|
{ID: node.ID(), LastIPPort: "fake", Address: new(pb.NodeAddress)},
|
|
|
|
},
|
|
|
|
time.Now().Add(2*time.Hour),
|
|
|
|
2000,
|
|
|
|
)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, orderLimits, 1)
|
|
|
|
|
|
|
|
orderLimit := orderLimits[0].Limit
|
|
|
|
order := &pb.Order{
|
|
|
|
SerialNumber: orderLimit.SerialNumber,
|
|
|
|
Amount: 1000,
|
|
|
|
}
|
|
|
|
signedOrder, err := signing.SignUplinkOrder(ctx, piecePrivateKey, order)
|
|
|
|
require.NoError(t, err)
|
2020-10-01 23:52:22 +01:00
|
|
|
order0 := &ordersfile.Info{
|
2020-07-01 23:05:01 +01:00
|
|
|
Limit: orderLimit,
|
|
|
|
Order: signedOrder,
|
|
|
|
}
|
|
|
|
|
|
|
|
// enter orders into unsent_orders
|
|
|
|
err = node.DB.Orders().Enqueue(ctx, order0)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
toSend, err := node.DB.Orders().ListUnsent(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSend, 1)
|
|
|
|
|
|
|
|
// trigger order send
|
|
|
|
service.Sender.TriggerWait()
|
|
|
|
|
2020-10-20 19:54:17 +01:00
|
|
|
// in phase3 the orders are only sent from the filestore
|
|
|
|
// so we expect any orders in ordersDB will remain there
|
2020-07-01 23:05:01 +01:00
|
|
|
toSend, err = node.DB.Orders().ListUnsent(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
2020-10-20 19:54:17 +01:00
|
|
|
require.Len(t, toSend, 1)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
archived, err := node.DB.Orders().ListArchived(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
2020-10-20 19:54:17 +01:00
|
|
|
require.Len(t, archived, 0)
|
2020-07-01 23:05:01 +01:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
func TestOrderFileStoreSettle(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 1,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
satellite := planet.Satellites[0]
|
|
|
|
uplinkPeer := planet.Uplinks[0]
|
|
|
|
satellite.Audit.Worker.Loop.Pause()
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
service := node.Storage2.Orders
|
|
|
|
service.Sender.Pause()
|
|
|
|
service.Cleanup.Pause()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
tomorrow := time.Now().Add(24 * time.Hour)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
// upload a file to generate an order on the storagenode
|
|
|
|
testData := testrand.Bytes(8 * memory.KiB)
|
|
|
|
err := uplinkPeer.Upload(ctx, satellite, "testbucket", "test/path", testData)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-11-18 13:38:03 +00:00
|
|
|
require.NoError(t, planet.WaitForStorageNodeEndpoints(ctx))
|
|
|
|
|
2020-10-15 19:57:02 +01:00
|
|
|
toSend, err := node.OrdersStore.ListUnsentBySatellite(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSend, 1)
|
|
|
|
ordersForSat := toSend[satellite.ID()]
|
|
|
|
require.Len(t, ordersForSat.InfoList, 1)
|
|
|
|
|
|
|
|
// trigger order send
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
service.SendOrders(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
2020-10-15 19:57:02 +01:00
|
|
|
toSend, err = node.OrdersStore.ListUnsentBySatellite(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSend, 0)
|
|
|
|
|
|
|
|
archived, err := node.OrdersStore.ListArchived()
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, archived, 1)
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO remove when db is removed.
|
2020-10-15 19:57:02 +01:00
|
|
|
// TestOrderFileStoreAndDBSettle ensures that if orders exist in both DB and filestore, that the DB orders and filestore are both settled.
|
2020-07-01 23:05:01 +01:00
|
|
|
func TestOrderFileStoreAndDBSettle(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 1,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
satellite := planet.Satellites[0]
|
|
|
|
uplinkPeer := planet.Uplinks[0]
|
|
|
|
satellite.Audit.Worker.Loop.Pause()
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
service := node.Storage2.Orders
|
|
|
|
service.Sender.Pause()
|
|
|
|
service.Cleanup.Pause()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
tomorrow := time.Now().Add(24 * time.Hour)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
2020-11-18 21:39:13 +00:00
|
|
|
bucketname := "testbucket"
|
|
|
|
err := uplinkPeer.CreateBucket(ctx, satellite, bucketname)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-07-01 23:05:01 +01:00
|
|
|
// add orders to orders DB
|
|
|
|
_, orderLimits, piecePrivateKey, err := satellite.Orders.Service.CreatePutOrderLimits(
|
|
|
|
ctx,
|
2020-11-18 21:39:13 +00:00
|
|
|
metabase.BucketLocation{ProjectID: uplinkPeer.Projects[0].ID, BucketName: bucketname},
|
2023-07-07 09:31:58 +01:00
|
|
|
[]*nodeselection.SelectedNode{
|
2020-07-01 23:05:01 +01:00
|
|
|
{ID: node.ID(), LastIPPort: "fake", Address: new(pb.NodeAddress)},
|
|
|
|
},
|
|
|
|
time.Now().Add(2*time.Hour),
|
|
|
|
2000,
|
|
|
|
)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, orderLimits, 1)
|
|
|
|
|
|
|
|
orderLimit := orderLimits[0].Limit
|
|
|
|
order := &pb.Order{
|
|
|
|
SerialNumber: orderLimit.SerialNumber,
|
|
|
|
Amount: 1000,
|
|
|
|
}
|
|
|
|
signedOrder, err := signing.SignUplinkOrder(ctx, piecePrivateKey, order)
|
|
|
|
require.NoError(t, err)
|
2020-10-01 23:52:22 +01:00
|
|
|
order0 := &ordersfile.Info{
|
2020-07-01 23:05:01 +01:00
|
|
|
Limit: orderLimit,
|
|
|
|
Order: signedOrder,
|
|
|
|
}
|
|
|
|
|
|
|
|
// enter orders into unsent_orders
|
|
|
|
err = node.DB.Orders().Enqueue(ctx, order0)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
toSendDB, err := node.DB.Orders().ListUnsent(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSendDB, 1)
|
|
|
|
|
|
|
|
// upload a file to add orders to filestore
|
|
|
|
testData := testrand.Bytes(8 * memory.KiB)
|
|
|
|
err = uplinkPeer.Upload(ctx, satellite, "testbucket", "test/path", testData)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-11-18 13:38:03 +00:00
|
|
|
require.NoError(t, planet.WaitForStorageNodeEndpoints(ctx))
|
|
|
|
|
2020-10-15 19:57:02 +01:00
|
|
|
toSendFileStore, err := node.OrdersStore.ListUnsentBySatellite(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSendFileStore, 1)
|
|
|
|
ordersForSat := toSendFileStore[satellite.ID()]
|
|
|
|
require.Len(t, ordersForSat.InfoList, 1)
|
|
|
|
|
|
|
|
// trigger order send
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
service.SendOrders(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
2020-10-20 19:54:17 +01:00
|
|
|
// DB should not be archived in phase3, but and filestore orders should be archived.
|
2020-07-01 23:05:01 +01:00
|
|
|
toSendDB, err = node.DB.Orders().ListUnsent(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
2020-10-20 19:54:17 +01:00
|
|
|
require.Len(t, toSendDB, 1)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
archived, err := node.DB.Orders().ListArchived(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
2020-10-20 19:54:17 +01:00
|
|
|
require.Len(t, archived, 0)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
2020-10-15 19:57:02 +01:00
|
|
|
toSendFileStore, err = node.OrdersStore.ListUnsentBySatellite(ctx, tomorrow)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, toSendFileStore, 0)
|
2020-10-15 19:57:02 +01:00
|
|
|
filestoreArchived, err := node.OrdersStore.ListArchived()
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
2020-10-15 19:57:02 +01:00
|
|
|
require.Len(t, filestoreArchived, 1)
|
2020-07-01 23:05:01 +01:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO remove when db is removed.
|
|
|
|
func TestCleanArchiveDB(t *testing.T) {
|
2019-08-22 15:33:14 +01:00
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 0,
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
2019-09-11 23:37:01 +01:00
|
|
|
planet.Satellites[0].Audit.Worker.Loop.Pause()
|
2019-08-22 15:33:14 +01:00
|
|
|
satellite := planet.Satellites[0].ID()
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
service := node.Storage2.Orders
|
|
|
|
service.Sender.Pause()
|
|
|
|
service.Cleanup.Pause()
|
|
|
|
|
|
|
|
serialNumber0 := testrand.SerialNumber()
|
|
|
|
serialNumber1 := testrand.SerialNumber()
|
|
|
|
|
2020-10-01 23:52:22 +01:00
|
|
|
order0 := &ordersfile.Info{
|
2019-08-22 15:33:14 +01:00
|
|
|
Limit: &pb.OrderLimit{
|
|
|
|
SatelliteId: satellite,
|
|
|
|
SerialNumber: serialNumber0,
|
|
|
|
},
|
|
|
|
Order: &pb.Order{},
|
|
|
|
}
|
2020-10-01 23:52:22 +01:00
|
|
|
order1 := &ordersfile.Info{
|
2019-08-22 15:33:14 +01:00
|
|
|
Limit: &pb.OrderLimit{
|
|
|
|
SatelliteId: satellite,
|
|
|
|
SerialNumber: serialNumber1,
|
|
|
|
},
|
|
|
|
Order: &pb.Order{},
|
|
|
|
}
|
|
|
|
|
|
|
|
// enter orders into unsent_orders
|
|
|
|
err := node.DB.Orders().Enqueue(ctx, order0)
|
|
|
|
require.NoError(t, err)
|
|
|
|
err = node.DB.Orders().Enqueue(ctx, order1)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
2020-03-10 22:05:01 +00:00
|
|
|
now := time.Now()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
yesterday := now.Add(-24 * time.Hour)
|
2019-08-22 15:33:14 +01:00
|
|
|
|
|
|
|
// archive one order yesterday, one today
|
|
|
|
err = node.DB.Orders().Archive(ctx, yesterday, orders.ArchiveRequest{
|
|
|
|
Satellite: satellite,
|
|
|
|
Serial: serialNumber0,
|
|
|
|
Status: orders.StatusAccepted,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
err = node.DB.Orders().Archive(ctx, now, orders.ArchiveRequest{
|
|
|
|
Satellite: satellite,
|
|
|
|
Serial: serialNumber1,
|
|
|
|
Status: orders.StatusAccepted,
|
|
|
|
})
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
// trigger cleanup of archived orders older than 12 hours
|
|
|
|
require.NoError(t, service.CleanArchive(ctx, now.Add(-12*time.Hour)))
|
2019-08-22 15:33:14 +01:00
|
|
|
|
|
|
|
archived, err := node.DB.Orders().ListArchived(ctx, 10)
|
|
|
|
require.NoError(t, err)
|
2020-04-30 13:00:06 +01:00
|
|
|
|
2019-08-22 15:33:14 +01:00
|
|
|
require.Len(t, archived, 1)
|
|
|
|
require.Equal(t, archived[0].Limit.SerialNumber, serialNumber1)
|
|
|
|
})
|
|
|
|
}
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
func TestCleanArchiveFileStore(t *testing.T) {
|
|
|
|
testplanet.Run(t, testplanet.Config{
|
|
|
|
SatelliteCount: 1, StorageNodeCount: 1, UplinkCount: 0,
|
|
|
|
Reconfigure: testplanet.Reconfigure{
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
StorageNode: func(_ int, config *storagenode.Config) {
|
|
|
|
// A large grace period so we can write to multiple buckets at once
|
|
|
|
config.Storage2.OrderLimitGracePeriod = 48 * time.Hour
|
2020-07-01 23:05:01 +01:00
|
|
|
},
|
|
|
|
},
|
|
|
|
}, func(t *testing.T, ctx *testcontext.Context, planet *testplanet.Planet) {
|
|
|
|
planet.Satellites[0].Audit.Worker.Loop.Pause()
|
|
|
|
satellite := planet.Satellites[0].ID()
|
|
|
|
node := planet.StorageNodes[0]
|
|
|
|
service := node.Storage2.Orders
|
|
|
|
service.Sender.Pause()
|
|
|
|
service.Cleanup.Pause()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
now := time.Now()
|
|
|
|
yesterday := now.Add(-24 * time.Hour)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
serialNumber0 := testrand.SerialNumber()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
createdAt0 := now
|
2020-07-01 23:05:01 +01:00
|
|
|
serialNumber1 := testrand.SerialNumber()
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
createdAt1 := now.Add(-24 * time.Hour)
|
2020-07-01 23:05:01 +01:00
|
|
|
|
2020-10-01 23:52:22 +01:00
|
|
|
order0 := &ordersfile.Info{
|
2020-07-01 23:05:01 +01:00
|
|
|
Limit: &pb.OrderLimit{
|
|
|
|
SatelliteId: satellite,
|
|
|
|
SerialNumber: serialNumber0,
|
|
|
|
OrderCreation: createdAt0,
|
|
|
|
},
|
|
|
|
Order: &pb.Order{},
|
|
|
|
}
|
2020-10-01 23:52:22 +01:00
|
|
|
order1 := &ordersfile.Info{
|
2020-07-01 23:05:01 +01:00
|
|
|
Limit: &pb.OrderLimit{
|
|
|
|
SatelliteId: satellite,
|
|
|
|
SerialNumber: serialNumber1,
|
|
|
|
OrderCreation: createdAt1,
|
|
|
|
},
|
|
|
|
Order: &pb.Order{},
|
|
|
|
}
|
|
|
|
|
|
|
|
// enqueue both orders; they will be placed in separate buckets because they have different creation hours
|
|
|
|
err := node.OrdersStore.Enqueue(order0)
|
|
|
|
require.NoError(t, err)
|
|
|
|
err = node.OrdersStore.Enqueue(order1)
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
// archive one order yesterday, one today
|
2020-10-06 17:14:25 +01:00
|
|
|
unsentInfo := orders.UnsentInfo{Version: ordersfile.V1}
|
2020-10-01 23:52:22 +01:00
|
|
|
unsentInfo.CreatedAtHour = createdAt0.Truncate(time.Hour)
|
|
|
|
err = node.OrdersStore.Archive(satellite, unsentInfo, yesterday, pb.SettlementWithWindowResponse_ACCEPTED)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
2020-10-01 23:52:22 +01:00
|
|
|
unsentInfo.CreatedAtHour = createdAt1.Truncate(time.Hour)
|
|
|
|
err = node.OrdersStore.Archive(satellite, unsentInfo, now, pb.SettlementWithWindowResponse_ACCEPTED)
|
2020-07-01 23:05:01 +01:00
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
archived, err := node.OrdersStore.ListArchived()
|
|
|
|
require.NoError(t, err)
|
|
|
|
require.Len(t, archived, 2)
|
|
|
|
|
storagenode: live tracking of order window usage
This change accomplishes multiple things:
1. Instead of having a max in flight time, which means
we effectively have a minimum bandwidth for uploads
and downloads, we keep track of what windows have
active requests happening in them.
2. We don't double check when we save the order to see if it
is too old: by then, it's too late. A malicious uplink
could just submit orders outside of the grace window and
receive all the data, but the node would just not commit
it, so the uplink gets free traffic. Because the endpoints
also check for the order being too old, this would be a
very tight race that depends on knowledge of the node system
clock, but best to not have the race exist. Instead, we piggy
back off of the in flight tracking and do the check when
we start to handle the order, and commit at the end.
3. Change the functions that send orders and list unsent
orders to accept a time at which that operation is
happening. This way, in tests, we can pretend we're
listing or sending far into the future after the windows
are available to send, rather than exposing test functions
to modify internal state about the grace period to get
the desired effect. This brings tests closer to actual
usage in production.
4. Change the calculation for if an order is allowed to be
enqueued due to the grace period to just look at the
order creation time, rather than some computation involving
the window it will be in. In this way, you can easily
answer the question of "will this order be accepted?" by
asking "is it older than X?" where X is the grace period.
5. Increases the frequency we check to send up orders to once
every 5 minutes instead of once every hour because we already
have hour-long buffering due to the windows. This decreases
the maximum latency that an order will be reported back to
the satellite by 55 minutes.
Change-Id: Ie08b90d139d45ee89b82347e191a2f8db1b88036
2020-08-12 20:01:43 +01:00
|
|
|
// trigger cleanup of archived orders older than 12 hours
|
|
|
|
require.NoError(t, service.CleanArchive(ctx, now.Add(-12*time.Hour)))
|
2020-07-01 23:05:01 +01:00
|
|
|
|
|
|
|
archived, err = node.OrdersStore.ListArchived()
|
|
|
|
require.NoError(t, err)
|
|
|
|
|
|
|
|
require.Len(t, archived, 1)
|
|
|
|
require.Equal(t, archived[0].Limit.SerialNumber, serialNumber1)
|
|
|
|
})
|
|
|
|
}
|