argoproj · jessesuen · Nov 2, 2018 · Oct 15, 2018 · Oct 16, 2018 · Oct 16, 2018
diff --git a/workflow/controller/dag.go b/workflow/controller/dag.go
@@ -308,7 +308,7 @@ func (woc *wfOperationCtx) executeDAGTask(dagCtx *dagContext, taskName string) {
 			}
 		}
 		// Finally execute the template
-		_, _ = woc.executeTemplate(t.Template, t.Arguments, taskNodeName, dagCtx.boundaryID)
+		_, _ = woc.executeTemplate(t.Template, t.Arguments, taskNodeName, dagCtx.boundaryID, dagCtx.boundaryName)
 	}
 
 	// If we expanded the task, we still need to create the task entry for the non-expanded node,

diff --git a/workflow/controller/operator.go b/workflow/controller/operator.go
@@ -152,7 +152,7 @@ func (woc *wfOperationCtx) operate() {
 	}
 	var workflowStatus wfv1.NodePhase
 	var workflowMessage string
-	node, _ := woc.executeTemplate(woc.wf.Spec.Entrypoint, woc.wf.Spec.Arguments, woc.wf.ObjectMeta.Name, "")
+	node, _ := woc.executeTemplate(woc.wf.Spec.Entrypoint, woc.wf.Spec.Arguments, woc.wf.ObjectMeta.Name, "", "")
 	if node == nil || !node.Completed() {
 		// node can be nil if a workflow created immediately in a parallelism == 0 state
 		return
@@ -175,7 +175,7 @@ func (woc *wfOperationCtx) operate() {
 		}
 		woc.log.Infof("Running OnExit handler: %s", woc.wf.Spec.OnExit)
 		onExitNodeName := woc.wf.ObjectMeta.Name + ".onExit"
-		onExitNode, _ = woc.executeTemplate(woc.wf.Spec.OnExit, woc.wf.Spec.Arguments, onExitNodeName, "")
+		onExitNode, _ = woc.executeTemplate(woc.wf.Spec.OnExit, woc.wf.Spec.Arguments, onExitNodeName, "", "")
 		if onExitNode == nil || !onExitNode.Completed() {
 			return
 		}
@@ -495,6 +495,27 @@ func (woc *wfOperationCtx) countActivePods(boundaryIDs ...string) int64 {
 	return activePods
 }
 
+// countActiveChildren returns how many direct children of the node named parentName are Pending or Running (0 when getNodeByName returns nil)
+func (woc *wfOperationCtx) countActiveChildren(parentName string) int64 {
+	parent := woc.getNodeByName(parentName)
+	if parent == nil {
+		return 0
+	}
+	var activeChildren int64
+	// walk the parent's child IDs; IDs with no entry in woc.wf.Status.Nodes are skipped, and only Pending/Running phases count as active
+	for _, c := range parent.Children {
+		node, ok := woc.wf.Status.Nodes[c]
+		if !ok {
+			continue
+		}
+		switch node.Phase {
+		case wfv1.NodePending, wfv1.NodeRunning:
+			activeChildren++
+		}
+	}
+	return activeChildren
+}
+
 // getAllWorkflowPods returns all pods related to the current workflow
 func (woc *wfOperationCtx) getAllWorkflowPods() (*apiv1.PodList, error) {
 	options := metav1.ListOptions{
@@ -866,8 +887,9 @@ func (woc *wfOperationCtx) getLastChildNode(node *wfv1.NodeStatus) (*wfv1.NodeSt
 // for the created node (if created). Nodes may not be created if parallelism or deadline exceeded.
 // nodeName is the name to be used as the name of the node, and boundaryID indicates which template
 // boundary this node belongs to.
-func (woc *wfOperationCtx) executeTemplate(templateName string, args wfv1.Arguments, nodeName string, boundaryID string) (*wfv1.NodeStatus, error) {
-	woc.log.Debugf("Evaluating node %s: template: %s", nodeName, templateName)
+func (woc *wfOperationCtx) executeTemplate(templateName string, args wfv1.Arguments, nodeName string, boundaryID string, parentName string) (*wfv1.NodeStatus, error) {
+	woc.log.Debugf("Evaluating node %s: template: %s, boundaryID: %s, parentName: %s", nodeName, templateName, boundaryID, parentName)
+
 	node := woc.getNodeByName(nodeName)
 	if node != nil && node.Completed() {
 		woc.log.Debugf("Node %s already completed", nodeName)
@@ -887,7 +909,7 @@ func (woc *wfOperationCtx) executeTemplate(templateName string, args wfv1.Argume
 		err := errors.Errorf(errors.CodeBadRequest, "Node %v error: template '%s' undefined", node, templateName)
 		return woc.initializeNode(nodeName, wfv1.NodeTypeSkipped, "", boundaryID, wfv1.NodeError, err.Error()), err
 	}
-	if err := woc.checkParallelism(tmpl, node, boundaryID); err != nil {
+	if err := woc.checkParallelism(tmpl, node, boundaryID, parentName); err != nil {
 		return node, err
 	}
 
@@ -1096,11 +1118,13 @@ func (woc *wfOperationCtx) markNodeError(nodeName string, err error) *wfv1.NodeS
 }
 
 // checkParallelism checks if the given template is able to be executed, considering the current active pods and workflow/template parallelism
-func (woc *wfOperationCtx) checkParallelism(tmpl *wfv1.Template, node *wfv1.NodeStatus, boundaryID string) error {
+func (woc *wfOperationCtx) checkParallelism(tmpl *wfv1.Template, node *wfv1.NodeStatus, boundaryID string, parentName string) error {
+	woc.log.Infof("tmpl type: %v, parallelism:%v, node:%v", tmpl.GetType(), tmpl.Parallelism, node)
 	if woc.wf.Spec.Parallelism != nil && woc.activePods >= *woc.wf.Spec.Parallelism {
 		woc.log.Infof("workflow active pod spec parallelism reached %d/%d", woc.activePods, *woc.wf.Spec.Parallelism)
 		return ErrParallelismReached
 	}
+
 	// TODO: repeated calls to countActivePods is not optimal
 	switch tmpl.GetType() {
 	case wfv1.TemplateTypeDAG, wfv1.TemplateTypeSteps:
@@ -1112,6 +1136,24 @@ func (woc *wfOperationCtx) checkParallelism(tmpl *wfv1.Template, node *wfv1.Node
 				return ErrParallelismReached
 			}
 		}
+
+		// if we are about to start executing a StepGroup, make sure our parent hasn't reached its limit.
+		// This check applies only when the node has not started yet, i.e. let it keep running if it has started
+		if boundaryID != "" && (node == nil || (node.Phase != wfv1.NodePending && node.Phase != wfv1.NodeRunning)) {
+			boundaryNode := woc.wf.Status.Nodes[boundaryID]
+			boundaryTemplate := woc.wf.GetTemplate(boundaryNode.TemplateName)
+			if boundaryTemplate.Parallelism != nil {
+				// for stepgroups, parent is different from boundary
+				activeSiblings := woc.countActiveChildren(parentName)
+
+				woc.log.Debugf("counted %d/%d active children in boundary %s of parent %s", activeSiblings, *boundaryTemplate.Parallelism, boundaryID, parentName)
+				if activeSiblings >= *boundaryTemplate.Parallelism {
+					woc.log.Infof("template (node %s) active pod parallelism reached %d/%d", boundaryID, activeSiblings, *boundaryTemplate.Parallelism)
+					return ErrParallelismReached
+				}
+			}
+		}
+
 	default:
 		// if we are about to execute a pod, make our parent hasn't reached it's limit
 		if boundaryID != "" {

diff --git a/workflow/controller/steps.go b/workflow/controller/steps.go
@@ -187,7 +187,7 @@ func (woc *wfOperationCtx) executeStepGroup(stepGroup []wfv1.WorkflowStep, sgNod
 			}
 			continue
 		}
-		childNode, err := woc.executeTemplate(step.Template, step.Arguments, childNodeName, stepsCtx.boundaryID)
+		childNode, err := woc.executeTemplate(step.Template, step.Arguments, childNodeName, stepsCtx.boundaryID, sgNodeName)
 		if err != nil {
 			switch err {
 			case ErrDeadlineExceeded: