
Error running 1000s of tasks: "etcdserver: request is too large" #1186 #1264

Merged · 16 commits · Mar 18, 2019
23 changes: 23 additions & 0 deletions cmd/argo/commands/get.go
@@ -8,6 +8,9 @@ import (
"strings"
"text/tabwriter"

"github.com/argoproj/argo/errors"
"github.com/argoproj/argo/workflow/util/file"

Contributor: Nitpick: unnecessary blank line

Member Author: I think the file watcher or the IntelliJ Go code formatter is doing this; it is grouping the imports.

"github.com/argoproj/pkg/humanize"
"github.com/ghodss/yaml"
"github.com/spf13/cobra"
@@ -36,6 +39,10 @@ func NewGetCommand() *cobra.Command {
if err != nil {
log.Fatal(err)
}
err = CheckAndDecompress(wf)
if err != nil {
log.Fatal(err)
}
printWorkflow(wf, output)
},
}
@@ -45,6 +52,22 @@ func NewGetCommand() *cobra.Command {
return command
}

func CheckAndDecompress(wf *wfv1.Workflow) error {
Contributor: The status.nodes field is used if the user runs argo list -o=wide: https://github.com/argoproj/argo/blob/master/cmd/argo/commands/list.go#L137

The nodes field is also accessed in argo logs: https://github.com/argoproj/argo/blob/master/cmd/argo/commands/logs.go#L139

I would suggest adding a GetNodes() method to the WorkflowStatus structure which does the same as CheckAndDecompress and returns the nodes, and using it everywhere in the CLI instead of Status.Nodes.
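
For illustration, a minimal sketch of the suggested helper (hypothetical: the method name, placement, and error handling follow this comment's proposal, not code from the PR, and it assumes the v1alpha1 package can import encoding/json and the PR's file util):

	// GetNodes returns the node status map, transparently decoding and
	// decompressing CompressedNodes when the plain map has been cleared.
	func (ws *WorkflowStatus) GetNodes() (map[string]NodeStatus, error) {
		if ws.CompressedNodes == "" {
			return ws.Nodes, nil
		}
		content, err := file.DecodeDecompressString(ws.CompressedNodes)
		if err != nil {
			return nil, err
		}
		nodes := make(map[string]NodeStatus)
		if err := json.Unmarshal([]byte(content), &nodes); err != nil {
			return nil, err
		}
		return nodes, nil
	}

CLI call sites would then read nodes, err := wf.Status.GetNodes() instead of touching wf.Status.Nodes directly.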

if wf.Status.CompressedNodes != "" {
nodeContent, err := file.DecodeDecompressString(wf.Status.CompressedNodes)
if err != nil {
return errors.InternalWrapError(err)
}
err = json.Unmarshal([]byte(nodeContent), &wf.Status.Nodes)
if err != nil {
log.Fatal(err)
return err
}
wf.Status.CompressedNodes = ""
}
return nil
}

func printWorkflow(wf *wfv1.Workflow, outFmt string) {
switch outFmt {
case "name":
2 changes: 2 additions & 0 deletions cmd/argo/commands/watch.go
@@ -45,6 +45,8 @@ func watchWorkflow(name string) {
select {
case next := <-watchIf.ResultChan():
wf, _ = next.Object.(*wfv1.Workflow)
err := CheckAndDecompress(wf)
errors.CheckError(err)
case <-ticker.C:
}
if wf == nil {
2 changes: 2 additions & 0 deletions pkg/apis/workflow/v1alpha1/types.go
@@ -477,6 +477,8 @@ type WorkflowStatus struct {
// A human readable message indicating details about why the workflow is in this condition.
Message string `json:"message,omitempty"`

CompressedNodes string `json:"compressedNodes,omitempty"`
Contributor: Please add a comment.

Member: Please add spaces after all // comments.


// Nodes is a mapping between a node ID and the node's status.
Nodes map[string]NodeStatus `json:"nodes,omitempty"`

48 changes: 34 additions & 14 deletions test/e2e/stress/pod-limits.yaml
@@ -1,4 +1,4 @@
# Stress test to test upper bounds of concurrent pods
Stress test to test upper bounds of concurrent pods
Contributor: Looks like # is missing

apiVersion: argoproj.io/v1alpha1
Contributor: Is this example workflow intended to reproduce the compression? Instead of running 1000 pods, can you please add an example which has 10 script steps, where each step produces very large output?

kind: Workflow
metadata:
@@ -7,19 +7,39 @@ spec:
entrypoint: pod-limits
arguments:
parameters:
- name: limit
value: 1000
- name: limit
value: 1000
Member: Can we revert this and stick to k8s YAML formatting (without extra spaces for lists)? All our other examples are this way.

Member Author: fixed


templates:
- name: pod-limits
steps:
- - name: run-pod
template: run-pod
withSequence:
count: "{{workflow.parameters.limit}}"
- name: pod-limits
inputs:
parameters:
- name: limit
steps:
- - name: gen-number-list
template: gen-number-list
arguments:
parameters:
- name: count
value: "{{inputs.parameters.limit}}"
- - name: run-pod
template: run-pod
withParam: "{{steps.gen-number-list.outputs.result}}"

- name: run-pod
container:
image: "alpine:3.7"
command: [sh, -c]
args: ["echo sleeping 1s; sleep 1"]
- name: gen-number-list
inputs:
parameters:
- name: count
script:
image: python:alpine3.6
command: [python]
source: |
import json
import sys
json.dump([i for i in range(1, {{inputs.parameters.count}}+1)], sys.stdout)
withSequence:
Contributor: The withSequence should be part of the workflow step which executes this template.

count: "{{workflow.parameters.limit}}"

- name: run-pod
container:
image: "alpine:3.7"
10 changes: 10 additions & 0 deletions workflow/controller/controller.go
@@ -243,6 +243,16 @@ func (wfc *WorkflowController) processNextItem() bool {
}

woc := newWorkflowOperationCtx(wf, wfc)
//Decompress the node if it is compressed

err = woc.checkAndDecompress()
if err != nil {
log.Warnf("Failed to decompress '%s' to workflow object: %v", key, err)
woc.markWorkflowFailed(fmt.Sprintf("invalid spec: %s", err.Error()))
woc.persistUpdates()
wfc.throttler.Remove(key)
return true
}
woc.operate()
if woc.wf.Status.Completed() {
wfc.throttler.Remove(key)
103 changes: 101 additions & 2 deletions workflow/controller/operator.go
@@ -11,6 +11,8 @@ import (
"strings"
"time"

"github.com/argoproj/argo/workflow/util/file"
Member: import blocks should follow this convention:

  1. standard packages
  2. third party packages
  3. project packages

argokubeerr "github.com/argoproj/pkg/kube/errors"
"github.com/argoproj/pkg/strftime"
jsonpatch "github.com/evanphx/json-patch"
@@ -72,6 +74,9 @@ var (
// for before requeuing the workflow onto the workqueue.
const maxOperationTime time.Duration = 10 * time.Second

//maxWorkflowSize is the maximum size for workflow.yaml
const maxWorkflowSize int = 1024 * 1024

// newWorkflowOperationCtx creates and initializes a new wfOperationCtx object.
func newWorkflowOperationCtx(wf *wfv1.Workflow, wfc *WorkflowController) *wfOperationCtx {
// NEVER modify objects from the store. It's a read-only, local cache.
@@ -275,14 +280,24 @@ func (woc *wfOperationCtx) persistUpdates() {
return
}
wfClient := woc.controller.wfclientset.ArgoprojV1alpha1().Workflows(woc.wf.ObjectMeta.Namespace)
woc.log.Info("Final size", woc.getSize())
if woc.wf.Status.CompressedNodes != "" {
Member: Maybe we should remove this line, like this:

	err := woc.checkAndCompress()
	if err != nil {
		woc.log.Warnf("Error compressing workflow: %v", err)
	}
	if woc.wf.Status.CompressedNodes != "" {
		woc.clearNodeStatusMap()
	}

Member Author: Thanks, updated


err := woc.checkAndCompress()
if err != nil {
woc.log.Warnf("Error compressing workflow: %v", err)
}
woc.clearNodeStatusMap()
}

_, err := wfClient.Update(woc.wf)
if err != nil {
woc.log.Warnf("Error updating workflow: %v", err)
woc.log.Warnf("Error updating workflow: %v %s", err, apierr.ReasonForError(err))
if argokubeerr.IsRequestEntityTooLargeErr(err) {
woc.persistWorkflowSizeLimitErr(wfClient, err)
return
}
if !apierr.IsConflict(err) {
if err != nil && !apierr.IsConflict(err) {
return
}
woc.log.Info("Re-appying updates on latest version and retrying update")
@@ -450,11 +465,32 @@ func (woc *wfOperationCtx) podReconciliation() error {
}

for _, pod := range podList.Items {
origNodeStatus := *woc.wf.Status.DeepCopy()
performAssessment(&pod)
err = woc.applyExecutionControl(&pod)
if err != nil {
woc.log.Warnf("Failed to apply execution control to pod %s", pod.Name)
}
err = woc.checkAndCompress()
if err != nil {
woc.wf.Status = origNodeStatus
nodeNameForPod := pod.Annotations[common.AnnotationKeyNodeName]
nodeID := woc.wf.NodeID(nodeNameForPod)
node := woc.wf.Status.Nodes[nodeID]
node.Message = fmt.Sprintf("%v", err)
woc.log.Warn(node.Message)
node.Outputs = nil
node.FinishedAt = metav1.Time{Time: time.Now().UTC()}
node.Phase = wfv1.NodeError
Member: There is a helper for all of this: woc.markNodePhase(). Can you use that instead?

Member Author: fixed
node.Completed()
Member: The call to node.Completed() is not useful.

Member Author: fixed

woc.wf.Status.Nodes[nodeID] = node
woc.updated = true
err = woc.checkAndCompress()
if err != nil {
woc.markWorkflowError(err, true)
}
}

}

// Now check for deleted pods. Iterate our nodes. If any one of our nodes does not show up in
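
As a rough sketch, the error path in the hunk above collapsed onto the suggested helper (hypothetical; the markNodePhase signature is assumed from the review comment, not quoted from the codebase):

	woc.wf.Status = origNodeStatus
	nodeNameForPod := pod.Annotations[common.AnnotationKeyNodeName]
	// Assumed helper: markNodePhase(nodeName string, phase wfv1.NodePhase,
	// message ...string) — one call records the phase, message, and finish
	// time instead of mutating the NodeStatus fields by hand and writing
	// the copy back into the map.
	woc.markNodePhase(nodeNameForPod, wfv1.NodeError, fmt.Sprintf("%v", err))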
@@ -1576,3 +1612,66 @@ func expandSequence(seq *wfv1.Sequence) ([]wfv1.Item, error) {
}
return items, nil
}

// getSize return the entire workflow json string size
func (woc *wfOperationCtx) getSize() int {
nodeContent, err := json.Marshal(woc.wf)
if err != nil {
return -1
}

compressNodeSize := len(woc.wf.Status.CompressedNodes)

if compressNodeSize > 0 {
nodeStatus, err := json.Marshal(woc.wf.Status.Nodes)
if err != nil {
return -1
}
return len(nodeContent) - len(nodeStatus)
}
return len(nodeContent)
}

//checkAndCompress will check the workflow size and compress node status if total workflow size is more than maxWorkflowSize.
//The compressed content will be assign to compressedNodes element and clear the nodestatus map.
func (woc *wfOperationCtx) checkAndCompress() error {

if woc.wf.Status.CompressedNodes != "" || (woc.wf.Status.CompressedNodes == "" && woc.getSize() >= maxWorkflowSize) {
Contributor: Can we simplify this logic a little bit? As I understand it, getSize is needed because it assumes that a workflow might have the Nodes and CompressedNodes fields set at the same time, and that the Nodes field will be removed before saving, right?

Instead, please change the logic to ensure these two fields are never set at the same time: checkAndDecompress should set the Nodes field and immediately remove CompressedNodes; checkAndCompress should immediately remove Nodes after compressing.

Member Author: This function gets called in two places. One is the final workflow save in persistUpdates(). The other is in podReconciliation, during workflow execution, to check that the output of each node fits into the size limit. In that scenario Nodes and CompressedNodes will both co-exist.

nodeContent, err := json.Marshal(woc.wf.Status.Nodes)
if err != nil {
return errors.InternalWrapError(err)
}
buff := string(nodeContent)
woc.wf.Status.CompressedNodes = file.CompressEncodeString(buff)

}
if woc.wf.Status.CompressedNodes != "" && woc.getSize() >= maxWorkflowSize {
return errors.InternalError(fmt.Sprintf("Workflow is longer than maximum allowed size. Size=%d", woc.getSize()))
}
return nil
}
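
For comparison, a sketch of the invariant the contributor proposes above — Nodes and CompressedNodes never both set (a hypothetical refactor; as the author explains, the PR deliberately lets both co-exist during reconciliation):

	// compressNodes compresses the node map and immediately drops it, so
	// the two representations never co-exist on the object.
	func (woc *wfOperationCtx) compressNodes() error {
		content, err := json.Marshal(woc.wf.Status.Nodes)
		if err != nil {
			return errors.InternalWrapError(err)
		}
		woc.wf.Status.CompressedNodes = file.CompressEncodeString(string(content))
		woc.wf.Status.Nodes = nil
		return nil
	}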

func (woc *wfOperationCtx) clearNodeStatusMap() {
Contributor: I think this is a more efficient way to do it:

	status := woc.wf.Status
	status.Nodes = nil
	woc.wf.Status = status

Member Author: updated

Member: wait, why isn't this just woc.wf.Status.Nodes = nil?

Member: Didn't see this question answered in the latest version. Am I missing something, or can this be simplified further to woc.wf.Status.Nodes = nil?

Member Author: updated

for k := range woc.wf.Status.Nodes {
delete(woc.wf.Status.Nodes, k)
}
}

//checkAndDecompress will decompress the compressednode and assign to workflow.status.nodes map.
func (woc *wfOperationCtx) checkAndDecompress() error {
if woc.wf.Status.CompressedNodes != "" {
nodeContent, err := file.DecodeDecompressString(woc.wf.Status.CompressedNodes)
if err != nil {
return errors.InternalWrapError(err)
}
var tempNodes map[string]wfv1.NodeStatus

err = json.Unmarshal([]byte(nodeContent), &tempNodes)
if err != nil {
woc.log.Warn(err)
Contributor: Did you mean return err here?

Member Author: updated
}
woc.wf.Status.Nodes = tempNodes
}
return nil
}
64 changes: 61 additions & 3 deletions workflow/util/file/fileutil.go
@@ -2,8 +2,11 @@ package file

import (
"archive/tar"
"bytes"
Member: I didn't catch this in the other review, but can we move fileutil.go under argoproj/argo/util/file instead of argoproj/argo/workflow/util/file? Since the package has nothing to do with workflows.
"compress/gzip"
"encoding/base64"
"io"
"io/ioutil"
"os"
"strings"

@@ -18,7 +21,7 @@ func IsFileOrDirExistInGZip(sourcePath string, gzipFilePath string) bool {
if os.IsNotExist(err) {
return false
}
defer closeFile(fi)
defer close(fi)

fz, err := gzip.NewReader(fi)
if err != nil {
Expand All @@ -44,9 +47,64 @@ func IsFileOrDirExistInGZip(sourcePath string, gzipFilePath string) bool {
return false
}

func closeFile(f *os.File) {
//Close the file
func close(f io.Closer) {
err := f.Close()
if err != nil {
log.Warn("Failed to close the file. v%", err)
log.Warn("Failed to close the file/writer/reader. ", err)
}
}

//EncodeContent will encode using base64
func EncodeContent(content []byte) string {
encoder := base64.StdEncoding
return encoder.EncodeToString(content)

}

//DecodeContent will decode using base64
func DecodeContent(content string) ([]byte, error) {
encoder := base64.StdEncoding
return encoder.DecodeString(content)
}

//CompressEncodeString will return the compressed string with base64 encoded
func CompressEncodeString(content string) string {
return EncodeContent(CompressContent([]byte(content)))
}

//DecodeDecompressString will return decode and decompress the
func DecodeDecompressString(content string) (string, error) {

buf, err := DecodeContent(content)
if err != nil {
return "", err
}
dBuf, err := DecompressContent(buf)
if err != nil {
return "", err
}
return string(dBuf), nil
}
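
A quick round-trip showing how these two helpers compose, the way the controller compresses node status and the CLI restores it (illustrative usage only):

	package main

	import (
		"fmt"

		"github.com/argoproj/argo/workflow/util/file"
	)

	func main() {
		status := `{"node-1":{"phase":"Succeeded"}}`
		// Gzip-compress then base64-encode; decoding reverses both steps.
		encoded := file.CompressEncodeString(status)
		decoded, err := file.DecodeDecompressString(encoded)
		if err != nil {
			panic(err)
		}
		fmt.Println(decoded == status) // true
	}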

//CompressContent will compress the byte array using zip writer
func CompressContent(content []byte) []byte {
var buf bytes.Buffer
zipWriter := gzip.NewWriter(&buf)

_, err := zipWriter.Write(content)
if err != nil {
log.Warn("Error in compressing. v%", err)
Member: This should be log.Warnf; also it should be %v, not v%.

Member Author: fixed
}
close(zipWriter)
return buf.Bytes()
}

//D
Member: Unfinished comment

Member Author: fixed
func DecompressContent(content []byte) ([]byte, error) {

buf := bytes.NewReader(content)
gZipReader, _ := gzip.NewReader(buf)
defer close(gZipReader)
return ioutil.ReadAll(gZipReader)
}