Skip to content

Commit

Permalink
add no pod events yet callback
Browse files Browse the repository at this point in the history
add lock to avoid data race on Out stream used for logging
  • Loading branch information
gabemontero committed Oct 12, 2021
1 parent d80f348 commit 9ba2e51
Show file tree
Hide file tree
Showing 3 changed files with 72 additions and 17 deletions.
64 changes: 56 additions & 8 deletions pkg/shp/cmd/build/run.go
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,7 @@ package build
import (
"errors"
"fmt"
"sync"
"time"

buildv1alpha1 "github.com/shipwright-io/build/pkg/apis/build/v1alpha1"
Expand Down Expand Up @@ -31,8 +32,11 @@ type RunCommand struct {
logTail *tail.Tail // follow container logs
tailLogsStarted map[string]bool // controls tail instance per container

buildName string // build name
logLock sync.Mutex

buildName string
buildRunName string
namespace string
buildRunSpec *buildv1alpha1.BuildRunSpec // stores command-line flags
shpClientset buildclientset.Interface
follow bool // flag to tail pod logs
Expand Down Expand Up @@ -65,6 +69,7 @@ func (r *RunCommand) Complete(params *params.Params, io *genericclioptions.IOStr
}
r.logTail = tail.NewTail(r.Cmd().Context(), clientset)
r.ioStreams = io
r.namespace = params.Namespace()
if r.follow {
if r.shpClientset, err = params.ShipwrightClientSet(); err != nil {
return err
Expand All @@ -85,6 +90,7 @@ func (r *RunCommand) Complete(params *params.Params, io *genericclioptions.IOStr

r.pw.WithOnPodModifiedFn(r.onEvent)
r.pw.WithTimeoutPodFn(r.onTimeout)
r.pw.WithNoPodEventsYetFn(r.onNoPodEventsYet)

}

Expand Down Expand Up @@ -113,9 +119,45 @@ func (r *RunCommand) tailLogs(pod *corev1.Pod) {
}
}

// onNoPodEventsYet reacts to the pod watcher telling us it has not received any
// pod events for our build run yet. It inspects the BuildRun's status to decide
// whether the run has already reached a terminal state (succeeded, failed,
// canceled, or deleted) — in which case following logs is pointless and we stop —
// or whether the run simply has not started, in which case we keep waiting.
func (r *RunCommand) onNoPodEventsYet() {
	r.Log(fmt.Sprintf("BuildRun %q log following has not observed any pod events yet.", r.buildRunName))
	br, err := r.shpClientset.ShipwrightV1alpha1().BuildRuns(r.namespace).Get(r.cmd.Context(), r.buildRunName, metav1.GetOptions{})
	if err != nil {
		r.Log(fmt.Sprintf("error accessing BuildRun %q: %s", r.buildRunName, err.Error()))
		return
	}

	c := br.Status.GetCondition(buildv1alpha1.Succeeded)
	giveUp := false
	msg := ""
	switch {
	case c != nil && c.Status == corev1.ConditionTrue:
		giveUp = true
		msg = fmt.Sprintf("BuildRun '%s' has been marked as successful.\n", br.Name)
	case c != nil && c.Status == corev1.ConditionFalse:
		giveUp = true
		msg = fmt.Sprintf("BuildRun '%s' has been marked as failed.\n", br.Name)
	case br.IsCanceled():
		giveUp = true
		msg = fmt.Sprintf("BuildRun '%s' has been canceled.\n", br.Name)
	case br.DeletionTimestamp != nil:
		giveUp = true
		msg = fmt.Sprintf("BuildRun '%s' has been deleted.\n", br.Name)
	case !br.HasStarted():
		// Not a terminal state: the BuildRun exists but has not started yet,
		// so keep following and wait for pod events to arrive.
		r.Log(fmt.Sprintf("BuildRun '%s' has not been started yet.\n", br.Name))
	}
	if giveUp {
		r.Log(msg)
		// the CLI binary is `shp` (see pkg/shp/...), not `ship`
		r.Log(fmt.Sprintf("exiting 'shp build run --follow' for BuildRun %q", br.Name))
		r.stop()
	}

}

// onTimeout reacts to either the context or request timeout causing the pod
// watcher to exit. It routes the message through Log so the write to the shared
// output stream is serialized (avoiding a data race with concurrent writers)
// and is emitted exactly once.
func (r *RunCommand) onTimeout(msg string) {
	r.Log(fmt.Sprintf("BuildRun %q log following has stopped because: %q\n", r.buildRunName, msg))
}

// onEvent reacts on pod state changes, to start and stop tailing container logs.
Expand All @@ -141,14 +183,14 @@ func (r *RunCommand) onEvent(pod *corev1.Pod) error {
err = fmt.Errorf("build pod '%s' has failed", pod.GetName())
}
// see if because of deletion or cancelation
fmt.Fprintf(r.ioStreams.Out, msg)
r.Log(msg)
r.stop()
return err
case corev1.PodSucceeded:
fmt.Fprintf(r.ioStreams.Out, "Pod '%s' has succeeded!\n", pod.GetName())
r.Log(fmt.Sprintf("Pod '%s' has succeeded!\n", pod.GetName()))
r.stop()
default:
fmt.Fprintf(r.ioStreams.Out, "Pod '%s' is in state %q...\n", pod.GetName(), string(pod.Status.Phase))
r.Log(fmt.Sprintf("Pod '%s' is in state %q...\n", pod.GetName(), string(pod.Status.Phase)))
// handle any issues with pulling images that may fail
for _, c := range pod.Status.Conditions {
if c.Type == corev1.PodInitialized || c.Type == corev1.ContainersReady {
Expand Down Expand Up @@ -182,7 +224,7 @@ func (r *RunCommand) Run(params *params.Params, ioStreams *genericclioptions.IOS
if err != nil {
return err
}
br, err = clientset.ShipwrightV1alpha1().BuildRuns(params.Namespace()).Create(r.cmd.Context(), br, metav1.CreateOptions{})
br, err = clientset.ShipwrightV1alpha1().BuildRuns(r.namespace).Create(r.cmd.Context(), br, metav1.CreateOptions{})
if err != nil {
return err
}
Expand All @@ -202,12 +244,17 @@ func (r *RunCommand) Run(params *params.Params, ioStreams *genericclioptions.IOS
r.buildName,
br.GetName(),
)}
r.pw.WithOnPodModifiedFn(r.onEvent)
r.pw.WithTimeoutPodFn(r.onTimeout)
_, err = r.pw.Start(listOpts)
return err
}

// Log writes msg to the command's output stream. Concurrent callers (pod
// watcher callbacks, log tailing) share the same stream, so a mutex guards
// each write to avoid a data race.
func (r *RunCommand) Log(msg string) {
	r.logLock.Lock()
	defer r.logLock.Unlock()
	// Fprint, not Fprintf: msg is data, not a format string. Fprintf(w, msg)
	// would misinterpret any '%' verbs inside the message (go vet printf).
	fmt.Fprint(r.ioStreams.Out, msg)
}

// runCmd instantiate the "build run" sub-command using common BuildRun flags.
func runCmd() runner.SubCommand {
cmd := &cobra.Command{
Expand All @@ -219,6 +266,7 @@ func runCmd() runner.SubCommand {
cmd: cmd,
buildRunSpec: flags.BuildRunSpecFromFlags(cmd.Flags()),
tailLogsStarted: make(map[string]bool),
logLock: sync.Mutex{},
}
cmd.Flags().BoolVarP(&runCommand.follow, "follow", "F", runCommand.follow, "Start a build and watch its log until it completes or fails.")
return runCommand
Expand Down
19 changes: 13 additions & 6 deletions pkg/shp/cmd/build/run_test.go
Original file line number Diff line number Diff line change
@@ -1,7 +1,9 @@
package build

import (
"bytes"
"strings"
"sync"
"testing"

buildv1alpha1 "github.com/shipwright-io/build/pkg/apis/build/v1alpha1"
Expand Down Expand Up @@ -129,6 +131,7 @@ func TestStartBuildRunFollowLog(t *testing.T) {
follow: true,
shpClientset: shpclientset,
tailLogsStarted: make(map[string]bool),
logLock: sync.Mutex{},
}

// set up context
Expand All @@ -153,9 +156,7 @@ func TestStartBuildRunFollowLog(t *testing.T) {
cmd.Complete(param, &ioStreams, []string{name})
if len(test.to) > 0 {
cmd.Run(param, &ioStreams)
if !strings.Contains(out.String(), test.logText) {
t.Errorf("test %s: unexpected output: %s", test.name, out.String())
}
checkLog(test.name, test.logText, cmd, out, t)
continue
}
go func() {
Expand All @@ -169,9 +170,15 @@ func TestStartBuildRunFollowLog(t *testing.T) {
// mimic watch events, bypassing k8s fake client watch hoopla whose plug points are not always useful;
pod.Status.Phase = test.phase
cmd.onEvent(pod)
if !strings.Contains(out.String(), test.logText) {
t.Errorf("test %s: unexpected output: %s", test.name, out.String())
}
checkLog(test.name, test.logText, cmd, out, t)
}
}

// checkLog asserts that text appears in the shared output buffer, failing the
// test with the full captured output otherwise.
func checkLog(name, text string, cmd *RunCommand, out *bytes.Buffer, t *testing.T) {
	// report failures at the caller's line, not inside this helper
	t.Helper()
	// need to employ log lock since accessing same iostream out used by Run cmd
	cmd.logLock.Lock()
	defer cmd.logLock.Unlock()
	if !strings.Contains(out.String(), text) {
		t.Errorf("test %s: unexpected output: %s", name, out.String())
	}
}
6 changes: 3 additions & 3 deletions pkg/shp/reactor/pod_watcher.go
Original file line number Diff line number Diff line change
Expand Up @@ -90,8 +90,8 @@ func (p *PodWatcher) WithNoPodEventsYetFn(fn NoPodEventsYetFn) *PodWatcher {

// handleEvent applies user informed functions against informed pod and event.
func (p *PodWatcher) handleEvent(pod *corev1.Pod, event watch.Event) error {
p.stopLock.Lock()
defer p.stopLock.Unlock()
//p.stopLock.Lock()
//defer p.stopLock.Unlock()
p.eventTicker.Stop()
switch event.Type {
case watch.Added:
Expand Down Expand Up @@ -185,9 +185,9 @@ func (p *PodWatcher) Stop() {
// along with canceling of builds
p.stopLock.Lock()
defer p.stopLock.Unlock()
p.eventTicker.Stop()
if !p.stopped {
close(p.stopCh)
p.eventTicker.Stop()
p.stopped = true
}
}
Expand Down

0 comments on commit 9ba2e51

Please sign in to comment.