cmd/storj-sim: ignore context canceled and flush output

It's possible that content was not being flushed from processes. For now, ignore other process failures under storj-sim network test. Once we get other processes stable, we can repropagate the error. Change-Id: I01ed572d7c779ab6451124f1e24e3d1168b3ea79
2022-08-02 14:52:24 +03:00 · 2022-08-02 14:52:24 +03:00 · 1cb3cbaecf
commit 1cb3cbaecf
parent 98b8c7be06
4 changed files with 129 additions and 17 deletions
--- a/cmd/storj-sim/network.go
+++ b/cmd/storj-sim/network.go
@ -86,6 +86,7 @@ func networkExec(flags *Flags, args []string, command string) error {
 	if err != nil {
 		return err
 	}
 	defer func() { _ = processes.Output.Flush() }()
 	ctx, cancel := NewCLIContext(context.Background())
 	defer cancel()
@ -133,6 +134,7 @@ func networkEnv(flags *Flags, args []string) error {
 	if err != nil {
 		return err
 	}
 	defer func() { _ = processes.Output.Flush() }()
 	// run exec before, since it will load env vars from configs
 	for _, process := range processes.List {
@ -168,6 +170,7 @@ func networkTest(flags *Flags, command string, args []string) error {
 	if err != nil {
 		return err
 	}
 	defer func() { _ = processes.Output.Flush() }()
 	ctx, cancel := NewCLIContext(context.Background())
@ -184,23 +187,33 @@ func networkTest(flags *Flags, command string, args []string) error {
 		process.Status.Started.Wait(ctx)
 	}
 	if err := ctx.Err(); err != nil {
-		return err
+		// If the context has been cancelled, it means that one of the processes failed.
 		// Wait for the processes to shut down themselves and return the first error.
 		return fmt.Errorf("network canceled: %w", group.Wait())
 	}
 	cmd := exec.CommandContext(ctx, command, args...)
 	cmd.Env = append(os.Environ(), processes.Env()...)
 	stdout := processes.Output.Prefixed("test:out")
 	defer func() { _ = stdout.Flush() }()
 	stderr := processes.Output.Prefixed("test:err")
 	defer func() { _ = stderr.Flush() }()
 	cmd.Stdout, cmd.Stderr = stdout, stderr
 	processgroup.Setup(cmd)
 	if printCommands {
 		fmt.Fprintf(processes.Output, "exec: %v\n", strings.Join(cmd.Args, " "))
 	}
 	errRun := cmd.Run()
 	if errRun != nil {
 		fmt.Fprintf(processes.Output, "test command failed: %v\n", errRun)
 	}
 	cancel()
-	return errs.Combine(errRun, processes.Close(), group.Wait())
+	_ = group.Wait()
 	return errs.Combine(errRun, processes.Close())
 }
 func networkDestroy(flags *Flags, args []string) error {
@ -506,7 +519,7 @@ func newNetwork(flags *Flags) (*Processes, error) {
 				var consoleAddress string
 				err := readConfigString(&consoleAddress, satellite.Directory, "console.address")
 				if err != nil {
-					return err
+					return fmt.Errorf("failed to read config string: %w", err)
 				}
 				// try with 100ms delays until we hit 3s
@ -514,14 +527,14 @@ func newNetwork(flags *Flags) (*Processes, error) {
 				for apiKey == "" {
 					apiKey, err = newConsoleEndpoints(consoleAddress).createOrGetAPIKey(context.Background())
 					if err != nil && time.Since(start) > 3*time.Second {
-						return err
+						return fmt.Errorf("failed to create account: %w", err)
 					}
 					time.Sleep(100 * time.Millisecond)
 				}
 				satNodeID, err := identity.NodeIDFromCertPath(filepath.Join(satellite.Directory, "identity.cert"))
 				if err != nil {
-					return err
+					return fmt.Errorf("failed to get node id from path: %w", err)
 				}
 				nodeURL := storj.NodeURL{
 					ID:      satNodeID,
@ -530,17 +543,17 @@ func newNetwork(flags *Flags) (*Processes, error) {
 				access, err := uplink.RequestAccessWithPassphrase(context.Background(), nodeURL.String(), apiKey, "")
 				if err != nil {
-					return err
+					return fmt.Errorf("failed to get passphrase: %w", err)
 				}
 				accessData, err := access.Serialize()
 				if err != nil {
-					return err
+					return fmt.Errorf("failed to serialize access: %w", err)
 				}
 				vip.Set("access", accessData)
 				if err := vip.WriteConfig(); err != nil {
-					return err
+					return fmt.Errorf("failed to write config: %w", err)
 				}
 			}
--- a/cmd/storj-sim/prefix.go
+++ b/cmd/storj-sim/prefix.go
@ -56,8 +56,14 @@ type prefixWriter struct {
 	buffer []byte
 }
 // WriterFlusher implements io.Writer and flushing of pending content.
 type WriterFlusher interface {
 	io.Writer
 	Flush() error
 }
 // Prefixed returns a new writer that has writes with specified prefix.
-func (writer *PrefixWriter) Prefixed(prefix string) io.Writer {
+func (writer *PrefixWriter) Prefixed(prefix string) WriterFlusher {
 	writer.mu.Lock()
 	writer.prefixlen = max(writer.prefixlen, len(prefix))
 	writer.mu.Unlock()
@ -75,6 +81,11 @@ func (writer *PrefixWriter) Write(data []byte) (int, error) {
 	return writer.root.Write(data)
 }
 // Flush any pending content.
 func (writer *PrefixWriter) Flush() error {
 	return writer.root.Flush()
 }
 // Write implements io.Writer that prefixes lines.
 func (writer *prefixWriter) Write(data []byte) (int, error) {
 	if len(data) == 0 {
@ -175,3 +186,70 @@ func (writer *prefixWriter) Write(data []byte) (int, error) {
 	return len(data), nil
 }
 // Flush flushes any pending data.
 func (writer *prefixWriter) Flush() error {
 	writer.local.Lock()
 	defer writer.local.Unlock()
 	buffer := writer.buffer
 	writer.buffer = nil
 	if len(buffer) == 0 {
 		return nil
 	}
 	writer.mu.Lock()
 	defer writer.mu.Unlock()
 	prefix := writer.prefix
 	id := writer.id
 	timeText := writer.nowFunc().Format(timeFormat)
 	for len(buffer) > 0 {
 		pos := bytes.IndexByte(buffer, '\n')
 		insertbreak := false
 		// did not find a linebreak
 		if pos < 0 {
 			pos = len(buffer)
 		}
 		// try to find a nice place where to break the line
 		if pos < 0 || pos > writer.maxline {
 			pos = writer.maxline - 1
 			for p := pos; p >= writer.maxline*2/3; p-- {
 				// is there a space we can break on?
 				if buffer[p] == ' ' {
 					pos = p
 					break
 				}
 			}
 			insertbreak = true
 		}
 		_, err := fmt.Fprintf(writer.dst, "%-*s %-*s %s | ", writer.prefixlen, prefix, maxIDLength, id, timeText)
 		if err != nil {
 			return err
 		}
 		_, err = writer.dst.Write(buffer[:pos])
 		buffer = buffer[pos:]
 		if err != nil {
 			return err
 		}
 		_, err = writer.dst.Write([]byte{'\n'})
 		if err != nil {
 			return err
 		}
 		// remove the linebreak from buffer, if it's not an insert
 		if !insertbreak && len(buffer) > 0 {
 			buffer = buffer[1:]
 		}
 		prefix = ""
 		id = ""
 		timeText = emptyTimeField
 	}
 	return nil
 }
--- a/cmd/storj-sim/prefix_test.go
+++ b/cmd/storj-sim/prefix_test.go
@ -17,7 +17,9 @@ import (
 func TestPrefixWriter(t *testing.T) {
 	root := NewPrefixWriter("", storjSimMaxLineLen, ioutil.Discard)
 	alpha := root.Prefixed("alpha")
 	defer func() { _ = alpha.Flush() }()
 	beta := root.Prefixed("beta")
 	defer func() { _ = beta.Flush() }()
 	var group errgroup.Group
 	defer func() {
--- a/cmd/storj-sim/process.go
+++ b/cmd/storj-sim/process.go
@ -5,6 +5,7 @@ package main
 import (
 	"context"
 	"errors"
 	"fmt"
 	"io"
 	"net"
@ -50,6 +51,8 @@ func NewProcesses(dir string, failfast bool) *Processes {
 // Exec executes a command on all processes.
 func (processes *Processes) Exec(ctx context.Context, command string) error {
 	defer func() { _ = processes.Output.Flush() }()
 	var group *errgroup.Group
 	if processes.FailFast {
 		group, ctx = errgroup.WithContext(ctx)
@ -65,7 +68,14 @@ func (processes *Processes) Start(ctx context.Context, group *errgroup.Group, co
 	for _, p := range processes.List {
 		process := p
 		group.Go(func() error {
-			return process.Exec(ctx, command)
+			err := process.Exec(ctx, command)
 			if errors.Is(err, context.Canceled) {
 				err = nil
 			}
 			if err != nil {
 				err = fmt.Errorf("%v failed: %w", process.Name, err)
 			}
 			return err
 		})
 	}
 }
@ -81,6 +91,8 @@ func (processes *Processes) Env() []string {
 // Close closes all the processes and their resources.
 func (processes *Processes) Close() error {
 	defer func() { _ = processes.Output.Flush() }()
 	var errlist errs.Group
 	for _, process := range processes.List {
 		errlist.Add(process.Close())
@ -168,8 +180,8 @@ type Process struct {
 	ExecBefore map[string]func(*Process) error
 	Arguments  Arguments
-	stdout io.Writer
+	stdout WriterFlusher
-	stderr io.Writer
+	stderr WriterFlusher
 }
 // New creates a process which can be run in the specified directory.
@ -203,6 +215,9 @@ func (process *Process) WaitForExited(dependency *Process) {
 // Exec runs the process using the arguments for a given command.
 func (process *Process) Exec(ctx context.Context, command string) (err error) {
 	defer func() { _ = process.stdout.Flush() }()
 	defer func() { _ = process.stderr.Flush() }()
 	// ensure that we always release all status fences
 	defer process.Status.Started.Release()
 	defer process.Status.Exited.Release()
@ -213,20 +228,20 @@ func (process *Process) Exec(ctx context.Context, command string) (err error) {
 	// wait for dependencies to start
 	for _, fence := range process.Wait {
 		if !fence.Wait(ctx) {
-			return ctx.Err()
+			return fmt.Errorf("waiting dependencies: %w", ctx.Err())
 		}
 	}
 	// in case we have an explicit delay then sleep
 	if process.Delay > 0 {
 		if !sync2.Sleep(ctx, process.Delay) {
-			return ctx.Err()
+			return fmt.Errorf("waiting for delay: %w", ctx.Err())
 		}
 	}
 	if exec, ok := process.ExecBefore[command]; ok {
 		if err := exec(process); err != nil {
-			return err
+			return fmt.Errorf("executing pre-actions: %w", err)
 		}
 	}
@ -275,7 +290,7 @@ func (process *Process) Exec(ctx context.Context, command string) (err error) {
 	if printCommands {
 		fmt.Fprintf(process.processes.Output, "%s running: %v\n", process.Name, strings.Join(cmd.Args, " "))
 		defer func() {
-			fmt.Fprintf(process.processes.Output, "%s exited: %v\n", process.Name, err)
+			fmt.Fprintf(process.processes.Output, "%s exited (code:%d): %v\n", process.Name, cmd.ProcessState.ExitCode(), err)
 		}()
 	}
@ -304,13 +319,17 @@ func (process *Process) Exec(ctx context.Context, command string) (err error) {
 	// wait for process completion
 	err = cmd.Wait()
-
+	if errors.Is(err, context.Canceled) && ctx.Err() != nil {
 		// Ignore error caused by context cancellation.
 		err = nil
 	}
 	// clear the error if the process was killed
 	if status, ok := cmd.ProcessState.Sys().(syscall.WaitStatus); ok {
 		if status.Signaled() && status.Signal() == os.Kill {
 			err = nil
 		}
 	}
 	return err
 }