kagent-dev · jsonmp-k8 · Apr 24, 2026 · Apr 24, 2026 · Apr 24, 2026 · Apr 24, 2026
diff --git a/design/EP-991-workflow-subagents.md b/design/EP-991-workflow-subagents.md
@@ -0,0 +1,190 @@
+# EP-991: Declarative Workflow Subagents
+
+- Issue: [#991](https://github.com/kagent-dev/kagent/issues/991)
+
+## Background
+
+Google ADK provides three workflow agent primitives — `SequentialAgent`, `ParallelAgent`, and `LoopAgent` — that deterministically orchestrate in-process sub-agents. kagent currently supports agent-to-agent delegation via A2A tool references, but this is LLM-driven (the model decides when and whether to call sub-agents). There is no way to declare deterministic multi-agent workflows in YAML.
+
+This EP adds a `workflow` field to the `DeclarativeAgentSpec` CRD that lets users declare Sequential, Parallel, and Loop orchestration patterns. Sub-agents are defined inline within the parent agent's CRD and run in-process within the same pod, sharing session state.
+
+## Motivation
+
+Users building multi-agent systems need deterministic orchestration patterns:
+- **Sequential**: Run agents in a fixed order (e.g., writer → editor → publisher)
+- **Parallel**: Run agents concurrently and merge results (e.g., research multiple topics simultaneously)
+- **Loop**: Iterate until a condition is met (e.g., write → critique → refine cycles)
+
+Today, users must either rely on the LLM to coordinate agents (non-deterministic) or write custom BYO agents in code. Declarative workflow support brings these patterns to YAML-only users and ensures reliable execution order.
+
+### Goals
+
+1. Support `Sequential`, `Parallel`, and `Loop` workflow types via CRD configuration
+2. Sub-agents run in-process within a single pod, sharing session state
+3. Each sub-agent can have its own system message, model config, and MCP tools
+4. Loop workflows support `maxIterations` and exit-on-escalation
+5. Both Python and Go runtimes support workflow agents
+
+### Non-Goals
+
+1. Remote sub-agents (separate pods communicating via A2A within a workflow)
+2. Nested workflows (a sub-agent that is itself a workflow)
+3. Conditional branching or DAG-based orchestration beyond what ADK provides
+4. UI visualization of workflow topology
+
+## Implementation
+
+### 1. CRD Types (`go/api/v1alpha2/agent_types.go`)
+
+New types added to the agent CRD:
+
+```go
+// +kubebuilder:validation:Enum=Sequential;Parallel;Loop
+type WorkflowType string
+
+type WorkflowSpec struct {
+    Type          WorkflowType     `json:"type"`
+    SubAgents     []InlineAgentSpec `json:"subAgents"`
+    MaxIterations *int             `json:"maxIterations,omitempty"` // Loop only
+}
+
+type InlineAgentSpec struct {
+    Name          string  `json:"name"`
+    Description   string  `json:"description,omitempty"`
+    SystemMessage string  `json:"systemMessage"`
+    ModelConfig   string  `json:"modelConfig,omitempty"` // inherits parent if unset
+    Tools         []*Tool `json:"tools,omitempty"`       // MCP tools only
+}
+```
+
+The `Workflow` field is added to `DeclarativeAgentSpec` with CEL validation rules:
+- `workflow` is mutually exclusive with `systemMessage`, `systemMessageFrom`, and `tools`
+- `workflow` is mutually exclusive with `memory`, `context`, and `executeCodeBlocks`
+- `maxIterations` is only valid for `Loop` type; when unset, the loop runs indefinitely until a sub-agent escalates
+
+### 2. ADK Config Types (`go/api/adk/types.go`)
+
+JSON-serializable types passed to both Python and Go runtimes:
+
+```go
+type WorkflowAgentConfig struct {
+    Type          string           `json:"type"` // "sequential", "parallel", "loop"
+    SubAgents     []SubAgentConfig `json:"sub_agents"`
+    MaxIterations *int             `json:"max_iterations,omitempty"`
+}
+
+type SubAgentConfig struct {
+    Name        string                `json:"name"`
+    Description string                `json:"description,omitempty"`
+    Instruction string                `json:"instruction"`
+    Model       Model                 `json:"model"`
+    HttpTools   []HttpMcpServerConfig `json:"http_tools,omitempty"`
+    SseTools    []SseMcpServerConfig  `json:"sse_tools,omitempty"`
+}
+```
+
+The `AgentConfig` struct gets a new `Workflow *WorkflowAgentConfig` field.
+
+### 3. Translator Changes
+
+The translator's `translateInlineAgent` method branches when `Workflow` is set, calling a new `translateWorkflowAgent` method that:
+
+1. Resolves the default model config (used by sub-agents without their own)
+2. For each sub-agent: resolves its model (own or inherited), translates MCP tools
+3. Returns an `AgentConfig` with the `Workflow` field populated
+
+The `translateMCPServerTarget` method is refactored to support writing tool configs to `SubAgentConfig` in addition to `AgentConfig`.
+
+Validation rules enforced by the translator:
+- Sub-agent names must be unique within a workflow
+- Agent-as-tool references are not allowed within workflow sub-agents
+- `maxIterations` is only meaningful for the `Loop` type
+
+### 4. Python Runtime (`python/packages/kagent-adk/src/kagent/adk/types.py`)
+
+The `AgentConfig.to_agent()` method is refactored:
+- Existing logic moves to `_build_llm_agent()`
+- New `_build_workflow_agent()` constructs in-process sub-agents and wraps them in the appropriate ADK workflow agent
+
+```python
+from google.adk.agents import SequentialAgent, ParallelAgent, LoopAgent
+
+def _build_workflow_agent(self, name, sts_integration):
+    sub_agents = [self._build_sub_agent(cfg, sts_integration) for cfg in self.workflow.sub_agents]
+    match self.workflow.type:
+        case "sequential": return SequentialAgent(name=name, sub_agents=sub_agents, ...)
+        case "parallel":   return ParallelAgent(name=name, sub_agents=sub_agents, ...)
+        case "loop":       return LoopAgent(name=name, sub_agents=sub_agents, max_iterations=...)
+```
+
+### 5. Go Runtime (`go/adk/pkg/agent/agent.go`)
+
+New `CreateWorkflowAgent()` function creates sub-agents via `llmagent.New()` and wraps them in the appropriate workflow agent from `google.golang.org/adk/agent/workflowagents/`.
+
+The runner adapter (`go/adk/pkg/runner/adapter.go`) routes to `CreateWorkflowAgent()` when `agentConfig.Workflow != nil`.
+
+### Example: Sequential Workflow
+
+```yaml
+apiVersion: kagent.dev/v1alpha2
+kind: Agent
+metadata:
+  name: writer-critic
+spec:
+  type: Declarative
+  description: Generates content then reviews it
+  declarative:
+    runtime: python
+    modelConfig: default-model-config
+    workflow:
+      type: Sequential
+      subAgents:
+        - name: writer
+          description: Writes creative content
+          systemMessage: |
+            You are a creative writer. Write a compelling paragraph about the given topic.
+        - name: critic
+          description: Reviews and improves content
+          systemMessage: |
+            You are a writing critic. Review the previous content and provide improvements.
+```
+
+### Example: Loop Workflow
+
+```yaml
+apiVersion: kagent.dev/v1alpha2
+kind: Agent
+metadata:
+  name: iterative-refiner
+spec:
+  type: Declarative
+  description: Iteratively refines content through write-critique cycles
+  declarative:
+    modelConfig: default-model-config
+    workflow:
+      type: Loop
+      maxIterations: 5
+      subAgents:
+        - name: writer
+          systemMessage: Write or refine content based on feedback.
+        - name: critic
+          systemMessage: Critique the content. If satisfactory, escalate to stop the loop.
+```
+
+### Test Plan
+
+1. **Translator golden tests**: Input YAML + expected output JSON for sequential, parallel, and loop workflows
+2. **Python unit tests**: Verify `to_agent()` returns correct workflow agent type with correct sub-agent count and configuration
+3. **Go unit tests**: Verify `CreateWorkflowAgent()` for all three workflow types
+4. **CRD validation**: Verify CEL rules reject invalid combinations (workflow + systemMessage, maxIterations on non-Loop)
+
+## Alternatives
+
+**Remote sub-agents via A2A**: Each sub-agent as a separate Agent CR and pod. Rejected because ADK workflow agents require in-process sub-agents sharing session state. Remote A2A adds network latency and breaks session state sharing. The existing agent-as-tool pattern already covers the remote case.
+
+**Workflow as a separate CRD**: A dedicated `Workflow` resource type that references Agent CRs. Rejected for the same reason — ADK workflow agents need in-process sub-agents, not separate pods.
+
+## Open Questions
+
+1. Should sub-agents within a workflow be allowed to reference remote agents (other Agent CRs) as tools? Currently prohibited for simplicity; could be added later since the pod already has network access.
+2. Should nested workflows (a sub-agent that is itself a workflow) be supported? Deferred to a future EP.
@@ -14,6 +14,9 @@ import (
 	"github.com/kagent-dev/kagent/go/api/adk"
 	"google.golang.org/adk/agent"
 	"google.golang.org/adk/agent/llmagent"
+	"google.golang.org/adk/agent/workflowagents/loopagent"
+	"google.golang.org/adk/agent/workflowagents/parallelagent"
+	"google.golang.org/adk/agent/workflowagents/sequentialagent"
 	adkmodel "google.golang.org/adk/model"
 	adkgemini "google.golang.org/adk/model/gemini"
 	"google.golang.org/adk/tool"
@@ -37,6 +40,101 @@ func CreateGoogleADKAgent(ctx context.Context, agentConfig *adk.AgentConfig, age
 	return a, err
 }
 
+// CreateWorkflowAgent creates a workflow agent (Sequential, Parallel, or Loop)
+// from a config that contains a Workflow specification.
+//
+// Every entry of agentConfig.Workflow.SubAgents is built as an in-process LLM
+// agent via createInProcessSubAgent and attached, in declaration order, to the
+// workflow agent selected by Workflow.Type ("sequential", "parallel", or
+// "loop"). The resulting agent is named agentName and carries
+// agentConfig.Description.
+//
+// Workflow.MaxIterations is only consulted for "loop" workflows. When it is
+// nil the loop agent's MaxIterations field is left at its zero value.
+//
+// An error is returned when agentConfig or its Workflow is nil, when a loop
+// workflow declares a negative MaxIterations, when any sub-agent cannot be
+// created, or when Workflow.Type is not one of the supported values.
+func CreateWorkflowAgent(ctx context.Context, agentConfig *adk.AgentConfig, agentName string) (agent.Agent, error) {
+	if agentConfig == nil || agentConfig.Workflow == nil {
+		return nil, fmt.Errorf("agent config with workflow is required")
+	}
+
+	log := logr.FromContextOrDiscard(ctx)
+	workflow := agentConfig.Workflow
+
+	// Converting a negative int to uint wraps around to a huge value, which
+	// would silently turn an invalid bound into an effectively unbounded loop.
+	// Reject it up front, before any sub-agent (and its toolsets) is created.
+	if workflow.Type == "loop" && workflow.MaxIterations != nil && *workflow.MaxIterations < 0 {
+		return nil, fmt.Errorf("workflow maxIterations must be non-negative, got %d", *workflow.MaxIterations)
+	}
+
+	subAgents := make([]agent.Agent, 0, len(workflow.SubAgents))
+	// Iterate by index so each sub-agent receives a pointer to its own slice
+	// element rather than to a per-iteration copy.
+	for i := range workflow.SubAgents {
+		subAgentConfig := &workflow.SubAgents[i]
+		subAgent, err := createInProcessSubAgent(ctx, subAgentConfig, log)
+		if err != nil {
+			return nil, fmt.Errorf("failed to create sub-agent %q: %w", subAgentConfig.Name, err)
+		}
+		subAgents = append(subAgents, subAgent)
+	}
+
+	// Settings shared by all three workflow agent kinds.
+	baseConfig := agent.Config{
+		Name:        agentName,
+		Description: agentConfig.Description,
+		SubAgents:   subAgents,
+	}
+
+	switch workflow.Type {
+	case "sequential":
+		return sequentialagent.New(sequentialagent.Config{
+			AgentConfig: baseConfig,
+		})
+	case "parallel":
+		return parallelagent.New(parallelagent.Config{
+			AgentConfig: baseConfig,
+		})
+	case "loop":
+		loopConfig := loopagent.Config{
+			AgentConfig: baseConfig,
+		}
+		if workflow.MaxIterations != nil {
+			// Safe: negative values were rejected above.
+			loopConfig.MaxIterations = uint(*workflow.MaxIterations)
+		}
+		return loopagent.New(loopConfig)
+	default:
+		return nil, fmt.Errorf("unknown workflow type: %s", workflow.Type)
+	}
+}
+
+// createInProcessSubAgent turns a SubAgentConfig into an in-process LLM agent.
+//
+// It creates the MCP toolsets from the config's HTTP and SSE tool entries,
+// instantiates the model via CreateLLM, and registers the before/after/on-error
+// tool callbacks. When any tool entry lists names under RequireApproval, an
+// approval callback is placed ahead of the default before-tool callback and a
+// before-model callback from MakeStripConfirmationPartsCallback is added.
+//
+// An error is returned if the model cannot be created or if llmagent.New fails.
+func createInProcessSubAgent(ctx context.Context, config *adk.SubAgentConfig, log logr.Logger) (agent.Agent, error) {
+	toolsets := mcp.CreateToolsets(ctx, config.HttpTools, config.SseTools)
+
+	llm, err := CreateLLM(ctx, config.Model, log)
+	if err != nil {
+		return nil, fmt.Errorf("failed to create LLM: %w", err)
+	}
+
+	// Union of every tool name flagged as requiring approval, across both
+	// HTTP and SSE MCP tool entries.
+	needsApproval := make(map[string]bool)
+	for i := range config.HttpTools {
+		for _, toolName := range config.HttpTools[i].RequireApproval {
+			needsApproval[toolName] = true
+		}
+	}
+	for i := range config.SseTools {
+		for _, toolName := range config.SseTools[i].RequireApproval {
+			needsApproval[toolName] = true
+		}
+	}
+
+	toolHooks := []llmagent.BeforeToolCallback{makeBeforeToolCallback(log)}
+	modelHooks := []llmagent.BeforeModelCallback{}
+	if len(needsApproval) != 0 {
+		log.Info("Wiring approval callback for workflow sub-agent", "name", config.Name, "toolCount", len(needsApproval))
+		// The approval callback goes first in the list, ahead of the default one.
+		toolHooks = []llmagent.BeforeToolCallback{MakeApprovalCallback(needsApproval), toolHooks[0]}
+		modelHooks = append(modelHooks, MakeStripConfirmationPartsCallback())
+	}
+
+	agentCfg := llmagent.Config{
+		Name:                 config.Name,
+		Description:          config.Description,
+		Instruction:          config.Instruction,
+		Model:                llm,
+		Toolsets:             toolsets,
+		IncludeContents:      llmagent.IncludeContentsDefault,
+		BeforeToolCallbacks:  toolHooks,
+		BeforeModelCallbacks: modelHooks,
+		AfterToolCallbacks:   []llmagent.AfterToolCallback{makeAfterToolCallback(log)},
+		OnToolErrorCallbacks: []llmagent.OnToolErrorCallback{makeOnToolErrorCallback(log)},
+	}
+	return llmagent.New(agentCfg)
+}
+
 // CreateGoogleADKAgentWithSubagentSessionIDs creates a Google ADK agent and a
 // map of remote-subagent tool name → A2A context session ID (for stamping
 // outbound A2A events). Callers that only need the agent can use

@@ -9,6 +9,7 @@ import (
 	kagentmemory "github.com/kagent-dev/kagent/go/adk/pkg/memory"
 	"github.com/kagent-dev/kagent/go/adk/pkg/session"
 	"github.com/kagent-dev/kagent/go/api/adk"
+	adkagent "google.golang.org/adk/agent"
 	adkmemory "google.golang.org/adk/memory"
 	"google.golang.org/adk/runner"
 	adksession "google.golang.org/adk/session"
@@ -31,18 +32,32 @@ func CreateRunnerConfig(
 	appName string,
 	memoryService *kagentmemory.KagentMemoryService,
 ) (runner.Config, map[string]string, error) {
-	var extraTools []adktool.Tool
-	if memoryService != nil {
-		saveTool, err := kagentmemory.NewSaveMemoryTool(memoryService)
+	var adkAgent adkagent.Agent
+	var subagentSessionIDs map[string]string
+
+	if agentConfig.Workflow != nil {
+		// Workflow agents use a different creation path — no extra tools or remote agents.
+		var err error
+		adkAgent, err = agent.CreateWorkflowAgent(ctx, agentConfig, agentNameFromAppName(appName))
 		if err != nil {
-			return runner.Config{}, nil, fmt.Errorf("failed to create save_memory tool: %w", err)
+			return runner.Config{}, nil, fmt.Errorf("failed to create workflow agent: %w", err)
+		}
+		subagentSessionIDs = make(map[string]string)
+	} else {
+		var extraTools []adktool.Tool
+		if memoryService != nil {
+			saveTool, err := kagentmemory.NewSaveMemoryTool(memoryService)
+			if err != nil {
+				return runner.Config{}, nil, fmt.Errorf("failed to create save_memory tool: %w", err)
+			}
+			extraTools = append(extraTools, saveTool)
 		}
-		extraTools = append(extraTools, saveTool)
-	}
 
-	adkAgent, subagentSessionIDs, err := agent.CreateGoogleADKAgentWithSubagentSessionIDs(ctx, agentConfig, agentNameFromAppName(appName), extraTools...)
-	if err != nil {
-		return runner.Config{}, nil, fmt.Errorf("failed to create agent: %w", err)
+		var err error
+		adkAgent, subagentSessionIDs, err = agent.CreateGoogleADKAgentWithSubagentSessionIDs(ctx, agentConfig, agentNameFromAppName(appName), extraTools...)
+		if err != nil {
+			return runner.Config{}, nil, fmt.Errorf("failed to create agent: %w", err)
+		}
 	}
 
 	var adkSessionService adksession.Service