// Copyright (C) 2019 Storj Labs, Inc. // See LICENSE for copying information. package streams import ( "bytes" "context" "crypto/rand" "io" "io/ioutil" "strconv" "time" "github.com/gogo/protobuf/proto" "github.com/zeebo/errs" "go.uber.org/zap" monkit "gopkg.in/spacemonkeygo/monkit.v2" "storj.io/storj/pkg/eestream" "storj.io/storj/pkg/encryption" "storj.io/storj/pkg/paths" "storj.io/storj/pkg/pb" "storj.io/storj/pkg/ranger" "storj.io/storj/pkg/storage/meta" "storj.io/storj/pkg/storage/segments" "storj.io/storj/pkg/storj" "storj.io/storj/storage" ) var mon = monkit.Package() // Meta info about a stream type Meta struct { Modified time.Time Expiration time.Time Size int64 Data []byte } // convertMeta converts segment metadata to stream metadata func convertMeta(lastSegmentMeta segments.Meta, stream pb.StreamInfo, streamMeta pb.StreamMeta) Meta { return Meta{ Modified: lastSegmentMeta.Modified, Expiration: lastSegmentMeta.Expiration, Size: ((stream.NumberOfSegments - 1) * stream.SegmentsSize) + stream.LastSegmentSize, Data: stream.Metadata, } } // Store interface methods for streams to satisfy to be a store type typedStore interface { Meta(ctx context.Context, path Path, pathCipher storj.CipherSuite) (Meta, error) Get(ctx context.Context, path Path, pathCipher storj.CipherSuite) (ranger.Ranger, Meta, error) Put(ctx context.Context, path Path, pathCipher storj.CipherSuite, data io.Reader, metadata []byte, expiration time.Time) (Meta, error) Delete(ctx context.Context, path Path, pathCipher storj.CipherSuite) error List(ctx context.Context, prefix Path, startAfter, endBefore string, pathCipher storj.CipherSuite, recursive bool, limit int, metaFlags uint32) (items []ListItem, more bool, err error) } // streamStore is a store for streams. It implements typedStore as part of an ongoing migration // to use typed paths. See the shim for the store that the rest of the world interacts with. type streamStore struct { segments segments.Store segmentSize int64 encStore *encryption.Store encBlockSize int cipher storj.CipherSuite inlineThreshold int } // newTypedStreamStore constructs a typedStore backed by a streamStore. func newTypedStreamStore(segments segments.Store, segmentSize int64, encStore *encryption.Store, encBlockSize int, cipher storj.CipherSuite, inlineThreshold int) (typedStore, error) { if segmentSize <= 0 { return nil, errs.New("segment size must be larger than 0") } if encBlockSize <= 0 { return nil, errs.New("encryption block size must be larger than 0") } return &streamStore{ segments: segments, segmentSize: segmentSize, encStore: encStore, encBlockSize: encBlockSize, cipher: cipher, inlineThreshold: inlineThreshold, }, nil } // Put breaks up data as it comes in into s.segmentSize length pieces, then // store the first piece at s0/, second piece at s1/, and the // *last* piece at l/. Store the given metadata, along with the number // of segments, in a new protobuf, in the metadata of l/. func (s *streamStore) Put(ctx context.Context, path Path, pathCipher storj.CipherSuite, data io.Reader, metadata []byte, expiration time.Time) (m Meta, err error) { defer mon.Task()(&ctx)(&err) // previously file uploaded? err = s.Delete(ctx, path, pathCipher) if err != nil && !storage.ErrKeyNotFound.Has(err) { // something wrong happened checking for an existing // file with the same name return Meta{}, err } m, lastSegment, err := s.upload(ctx, path, pathCipher, data, metadata, expiration) if err != nil { s.cancelHandler(context.Background(), lastSegment, path, pathCipher) } return m, err } func (s *streamStore) upload(ctx context.Context, path Path, pathCipher storj.CipherSuite, data io.Reader, metadata []byte, expiration time.Time) (m Meta, lastSegment int64, err error) { defer mon.Task()(&ctx)(&err) var currentSegment int64 var streamSize int64 var putMeta segments.Meta defer func() { select { case <-ctx.Done(): s.cancelHandler(context.Background(), currentSegment, path, pathCipher) default: } }() derivedKey, err := encryption.DeriveContentKey(path.Bucket(), path.UnencryptedPath(), s.encStore) if err != nil { return Meta{}, currentSegment, err } encPath, err := encryption.EncryptPath(path.Bucket(), path.UnencryptedPath(), pathCipher, s.encStore) if err != nil { return Meta{}, currentSegment, err } eofReader := NewEOFReader(data) for !eofReader.isEOF() && !eofReader.hasError() { // generate random key for encrypting the segment's content var contentKey storj.Key _, err = rand.Read(contentKey[:]) if err != nil { return Meta{}, currentSegment, err } // Initialize the content nonce with the segment's index incremented by 1. // The increment by 1 is to avoid nonce reuse with the metadata encryption, // which is encrypted with the zero nonce. var contentNonce storj.Nonce _, err := encryption.Increment(&contentNonce, currentSegment+1) if err != nil { return Meta{}, currentSegment, err } encrypter, err := encryption.NewEncrypter(s.cipher, &contentKey, &contentNonce, s.encBlockSize) if err != nil { return Meta{}, currentSegment, err } // generate random nonce for encrypting the content key var keyNonce storj.Nonce _, err = rand.Read(keyNonce[:]) if err != nil { return Meta{}, currentSegment, err } encryptedKey, err := encryption.EncryptKey(&contentKey, s.cipher, derivedKey, &keyNonce) if err != nil { return Meta{}, currentSegment, err } sizeReader := NewSizeReader(eofReader) segmentReader := io.LimitReader(sizeReader, s.segmentSize) peekReader := segments.NewPeekThresholdReader(segmentReader) // If the data is larger than the inline threshold size, then it will be a remote segment isRemote, err := peekReader.IsLargerThan(s.inlineThreshold) if err != nil { return Meta{}, currentSegment, err } var transformedReader io.Reader if isRemote { paddedReader := eestream.PadReader(ioutil.NopCloser(peekReader), encrypter.InBlockSize()) transformedReader = encryption.TransformReader(paddedReader, encrypter, 0) } else { data, err := ioutil.ReadAll(peekReader) if err != nil { return Meta{}, currentSegment, err } cipherData, err := encryption.Encrypt(data, s.cipher, &contentKey, &contentNonce) if err != nil { return Meta{}, currentSegment, err } transformedReader = bytes.NewReader(cipherData) } putMeta, err = s.segments.Put(ctx, transformedReader, expiration, func() (storj.Path, []byte, error) { if !eofReader.isEOF() { segmentPath, err := createSegmentPath(ctx, currentSegment, path.Bucket(), encPath) if err != nil { return "", nil, err } if s.cipher == storj.EncNull { return segmentPath, nil, nil } segmentMeta, err := proto.Marshal(&pb.SegmentMeta{ EncryptedKey: encryptedKey, KeyNonce: keyNonce[:], }) if err != nil { return "", nil, err } return segmentPath, segmentMeta, nil } lastSegmentPath, err := createSegmentPath(ctx, -1, path.Bucket(), encPath) if err != nil { return "", nil, err } streamInfo, err := proto.Marshal(&pb.StreamInfo{ NumberOfSegments: currentSegment + 1, SegmentsSize: s.segmentSize, LastSegmentSize: sizeReader.Size(), Metadata: metadata, }) if err != nil { return "", nil, err } // encrypt metadata with the content encryption key and zero nonce encryptedStreamInfo, err := encryption.Encrypt(streamInfo, s.cipher, &contentKey, &storj.Nonce{}) if err != nil { return "", nil, err } streamMeta := pb.StreamMeta{ EncryptedStreamInfo: encryptedStreamInfo, EncryptionType: int32(s.cipher), EncryptionBlockSize: int32(s.encBlockSize), } if s.cipher != storj.EncNull { streamMeta.LastSegmentMeta = &pb.SegmentMeta{ EncryptedKey: encryptedKey, KeyNonce: keyNonce[:], } } lastSegmentMeta, err := proto.Marshal(&streamMeta) if err != nil { return "", nil, err } return lastSegmentPath, lastSegmentMeta, nil }) if err != nil { return Meta{}, currentSegment, err } currentSegment++ streamSize += sizeReader.Size() } if eofReader.hasError() { return Meta{}, currentSegment, eofReader.err } resultMeta := Meta{ Modified: putMeta.Modified, Expiration: expiration, Size: streamSize, Data: metadata, } return resultMeta, currentSegment, nil } // Get returns a ranger that knows what the overall size is (from l/) // and then returns the appropriate data from segments s0/, s1/, // ..., l/. func (s *streamStore) Get(ctx context.Context, path Path, pathCipher storj.CipherSuite) (rr ranger.Ranger, meta Meta, err error) { defer mon.Task()(&ctx)(&err) encPath, err := encryption.EncryptPath(path.Bucket(), path.UnencryptedPath(), pathCipher, s.encStore) if err != nil { return nil, Meta{}, err } segmentPath, err := createSegmentPath(ctx, -1, path.Bucket(), encPath) if err != nil { return nil, Meta{}, err } lastSegmentRanger, lastSegmentMeta, err := s.segments.Get(ctx, segmentPath) if err != nil { return nil, Meta{}, err } streamInfo, streamMeta, err := TypedDecryptStreamInfo(ctx, lastSegmentMeta.Data, path, s.encStore) if err != nil { return nil, Meta{}, err } stream := pb.StreamInfo{} err = proto.Unmarshal(streamInfo, &stream) if err != nil { return nil, Meta{}, err } derivedKey, err := encryption.DeriveContentKey(path.Bucket(), path.UnencryptedPath(), s.encStore) if err != nil { return nil, Meta{}, err } var rangers []ranger.Ranger for i := int64(0); i < stream.NumberOfSegments-1; i++ { currentPath, err := createSegmentPath(ctx, i, path.Bucket(), encPath) if err != nil { return nil, Meta{}, err } var contentNonce storj.Nonce _, err = encryption.Increment(&contentNonce, i+1) if err != nil { return nil, Meta{}, err } rangers = append(rangers, &lazySegmentRanger{ segments: s.segments, path: currentPath, size: stream.SegmentsSize, derivedKey: derivedKey, startingNonce: &contentNonce, encBlockSize: int(streamMeta.EncryptionBlockSize), cipher: storj.CipherSuite(streamMeta.EncryptionType), }) } var contentNonce storj.Nonce _, err = encryption.Increment(&contentNonce, stream.NumberOfSegments) if err != nil { return nil, Meta{}, err } encryptedKey, keyNonce := getEncryptedKeyAndNonce(streamMeta.LastSegmentMeta) decryptedLastSegmentRanger, err := decryptRanger( ctx, lastSegmentRanger, stream.LastSegmentSize, storj.CipherSuite(streamMeta.EncryptionType), derivedKey, encryptedKey, keyNonce, &contentNonce, int(streamMeta.EncryptionBlockSize), ) if err != nil { return nil, Meta{}, err } rangers = append(rangers, decryptedLastSegmentRanger) catRangers := ranger.Concat(rangers...) meta = convertMeta(lastSegmentMeta, stream, streamMeta) return catRangers, meta, nil } // Meta implements Store.Meta func (s *streamStore) Meta(ctx context.Context, path Path, pathCipher storj.CipherSuite) (meta Meta, err error) { defer mon.Task()(&ctx)(&err) encPath, err := encryption.EncryptPath(path.Bucket(), path.UnencryptedPath(), pathCipher, s.encStore) if err != nil { return Meta{}, err } segmentPath, err := createSegmentPath(ctx, -1, path.Bucket(), encPath) if err != nil { return Meta{}, err } lastSegmentMeta, err := s.segments.Meta(ctx, segmentPath) if err != nil { return Meta{}, err } streamInfo, streamMeta, err := TypedDecryptStreamInfo(ctx, lastSegmentMeta.Data, path, s.encStore) if err != nil { return Meta{}, err } var stream pb.StreamInfo if err := proto.Unmarshal(streamInfo, &stream); err != nil { return Meta{}, err } return convertMeta(lastSegmentMeta, stream, streamMeta), nil } // Delete all the segments, with the last one last func (s *streamStore) Delete(ctx context.Context, path Path, pathCipher storj.CipherSuite) (err error) { defer mon.Task()(&ctx)(&err) encPath, err := encryption.EncryptPath(path.Bucket(), path.UnencryptedPath(), pathCipher, s.encStore) if err != nil { return err } lastSegmentPath, err := createSegmentPath(ctx, -1, path.Bucket(), encPath) if err != nil { return err } lastSegmentMeta, err := s.segments.Meta(ctx, lastSegmentPath) if err != nil { return err } streamInfo, _, err := TypedDecryptStreamInfo(ctx, lastSegmentMeta.Data, path, s.encStore) if err != nil { return err } var stream pb.StreamInfo if err := proto.Unmarshal(streamInfo, &stream); err != nil { return err } for i := 0; i < int(stream.NumberOfSegments-1); i++ { currentPath, err := createSegmentPath(ctx, int64(i), path.Bucket(), encPath) if err != nil { return err } err = s.segments.Delete(ctx, currentPath) if err != nil { return err } } return s.segments.Delete(ctx, lastSegmentPath) } // ListItem is a single item in a listing type ListItem struct { Path string Meta Meta IsPrefix bool } // List all the paths inside l/, stripping off the l/ prefix func (s *streamStore) List(ctx context.Context, prefix Path, startAfter, endBefore string, pathCipher storj.CipherSuite, recursive bool, limit int, metaFlags uint32) (items []ListItem, more bool, err error) { defer mon.Task()(&ctx)(&err) if metaFlags&meta.Size != 0 { // Calculating the stream's size require also the user-defined metadata, // where stream store keeps info about the number of segments and their size. metaFlags |= meta.UserDefined } prefixKey, err := encryption.DerivePathKey(prefix.Bucket(), prefix.UnencryptedPath(), s.encStore) if err != nil { return nil, false, err } encPrefix, err := encryption.EncryptPath(prefix.Bucket(), prefix.UnencryptedPath(), pathCipher, s.encStore) if err != nil { return nil, false, err } // We have to encrypt startAfter and endBefore but only if they don't contain a bucket. // They contain a bucket if and only if the prefix has no bucket. This is why they are raw // strings instead of a typed string: it's either a bucket or an unencrypted path component // and that isn't known at compile time. needsEncryption := prefix.Bucket() != "" if needsEncryption { startAfter, err = encryption.EncryptPathRaw(startAfter, pathCipher, prefixKey) if err != nil { return nil, false, err } endBefore, err = encryption.EncryptPathRaw(endBefore, pathCipher, prefixKey) if err != nil { return nil, false, err } } segmentPrefix, err := createSegmentPath(ctx, -1, prefix.Bucket(), encPrefix) if err != nil { return nil, false, err } segments, more, err := s.segments.List(ctx, segmentPrefix, startAfter, endBefore, recursive, limit, metaFlags) if err != nil { return nil, false, err } items = make([]ListItem, len(segments)) for i, item := range segments { var path Path var itemPath string if needsEncryption { itemPath, err = encryption.DecryptPathRaw(item.Path, pathCipher, prefixKey) if err != nil { return nil, false, err } // TODO(jeff): this shouldn't be necessary if we handled trailing slashes // appropriately. there's some issues with list. fullPath := prefix.UnencryptedPath().Raw() if len(fullPath) > 0 && fullPath[len(fullPath)-1] != '/' { fullPath += "/" } fullPath += itemPath path = CreatePath(prefix.Bucket(), paths.NewUnencrypted(fullPath)) } else { itemPath = item.Path path = CreatePath(item.Path, paths.Unencrypted{}) } streamInfo, streamMeta, err := TypedDecryptStreamInfo(ctx, item.Meta.Data, path, s.encStore) if err != nil { return nil, false, err } var stream pb.StreamInfo if err := proto.Unmarshal(streamInfo, &stream); err != nil { return nil, false, err } newMeta := convertMeta(item.Meta, stream, streamMeta) items[i] = ListItem{ Path: itemPath, Meta: newMeta, IsPrefix: item.IsPrefix, } } return items, more, nil } type lazySegmentRanger struct { ranger ranger.Ranger segments segments.Store path storj.Path size int64 derivedKey *storj.Key startingNonce *storj.Nonce encBlockSize int cipher storj.CipherSuite } // Size implements Ranger.Size func (lr *lazySegmentRanger) Size() int64 { return lr.size } // Range implements Ranger.Range to be lazily connected func (lr *lazySegmentRanger) Range(ctx context.Context, offset, length int64) (_ io.ReadCloser, err error) { defer mon.Task()(&ctx)(&err) if lr.ranger == nil { rr, m, err := lr.segments.Get(ctx, lr.path) if err != nil { return nil, err } segmentMeta := pb.SegmentMeta{} err = proto.Unmarshal(m.Data, &segmentMeta) if err != nil { return nil, err } encryptedKey, keyNonce := getEncryptedKeyAndNonce(&segmentMeta) lr.ranger, err = decryptRanger(ctx, rr, lr.size, lr.cipher, lr.derivedKey, encryptedKey, keyNonce, lr.startingNonce, lr.encBlockSize) if err != nil { return nil, err } } return lr.ranger.Range(ctx, offset, length) } // decryptRanger returns a decrypted ranger of the given rr ranger func decryptRanger(ctx context.Context, rr ranger.Ranger, decryptedSize int64, cipher storj.CipherSuite, derivedKey *storj.Key, encryptedKey storj.EncryptedPrivateKey, encryptedKeyNonce, startingNonce *storj.Nonce, encBlockSize int) (decrypted ranger.Ranger, err error) { defer mon.Task()(&ctx)(&err) contentKey, err := encryption.DecryptKey(encryptedKey, cipher, derivedKey, encryptedKeyNonce) if err != nil { return nil, err } decrypter, err := encryption.NewDecrypter(cipher, contentKey, startingNonce, encBlockSize) if err != nil { return nil, err } var rd ranger.Ranger if rr.Size()%int64(decrypter.InBlockSize()) != 0 { reader, err := rr.Range(ctx, 0, rr.Size()) if err != nil { return nil, err } defer func() { err = errs.Combine(err, reader.Close()) }() cipherData, err := ioutil.ReadAll(reader) if err != nil { return nil, err } data, err := encryption.Decrypt(cipherData, cipher, contentKey, startingNonce) if err != nil { return nil, err } return ranger.ByteRanger(data), nil } rd, err = encryption.Transform(rr, decrypter) if err != nil { return nil, err } return eestream.Unpad(rd, int(rd.Size()-decryptedSize)) } // CancelHandler handles clean up of segments on receiving CTRL+C func (s *streamStore) cancelHandler(ctx context.Context, totalSegments int64, path Path, pathCipher storj.CipherSuite) { defer mon.Task()(&ctx)(nil) encPath, err := encryption.EncryptPath(path.Bucket(), path.UnencryptedPath(), pathCipher, s.encStore) if err != nil { zap.S().Warnf("Failed deleting segments: %v", err) return } for i := int64(0); i < totalSegments; i++ { currentPath, err := createSegmentPath(ctx, i, path.Bucket(), encPath) if err != nil { zap.S().Warnf("Failed deleting segment %d: %v", i, err) continue } err = s.segments.Delete(ctx, currentPath) if err != nil { zap.S().Warnf("Failed deleting segment %v: %v", currentPath, err) continue } } } func getEncryptedKeyAndNonce(m *pb.SegmentMeta) (storj.EncryptedPrivateKey, *storj.Nonce) { if m == nil { return nil, nil } var nonce storj.Nonce copy(nonce[:], m.KeyNonce) return m.EncryptedKey, &nonce } // TypedDecryptStreamInfo decrypts stream info func TypedDecryptStreamInfo(ctx context.Context, streamMetaBytes []byte, path Path, encStore *encryption.Store) ( streamInfo []byte, streamMeta pb.StreamMeta, err error) { defer mon.Task()(&ctx)(&err) err = proto.Unmarshal(streamMetaBytes, &streamMeta) if err != nil { return nil, pb.StreamMeta{}, err } derivedKey, err := encryption.DeriveContentKey(path.Bucket(), path.UnencryptedPath(), encStore) if err != nil { return nil, pb.StreamMeta{}, err } cipher := storj.CipherSuite(streamMeta.EncryptionType) encryptedKey, keyNonce := getEncryptedKeyAndNonce(streamMeta.LastSegmentMeta) contentKey, err := encryption.DecryptKey(encryptedKey, cipher, derivedKey, keyNonce) if err != nil { return nil, pb.StreamMeta{}, err } // decrypt metadata with the content encryption key and zero nonce streamInfo, err = encryption.Decrypt(streamMeta.EncryptedStreamInfo, cipher, contentKey, &storj.Nonce{}) return streamInfo, streamMeta, err } // createSegmentPath will create a storj.Path that the segment store expects. func createSegmentPath(ctx context.Context, segmentIndex int64, bucket string, encPath paths.Encrypted) (path storj.Path, err error) { defer mon.Task()(&ctx)(&err) if segmentIndex < -1 { return "", errs.New("invalid segment index") } var raw []byte if segmentIndex > -1 { raw = append(raw, 's') raw = append(raw, strconv.FormatInt(segmentIndex, 10)...) } else { raw = append(raw, 'l') } raw = append(raw, '/') if len(bucket) > 0 { raw = append(raw, bucket...) raw = append(raw, '/') if encPath.Valid() { raw = append(raw, encPath.Raw()...) raw = append(raw, '/') } } return storj.Path(raw[:len(raw)-1]), nil }