Sub-Agents

Decompose work across multiple specialized agents with a visible delegation log.

using System.ComponentModel;using System.Diagnostics.CodeAnalysis;using System.Net.Http;using System.Runtime.CompilerServices;using System.Text.Json;using System.Text.Json.Serialization;using Microsoft.Agents.AI;using Microsoft.Extensions.AI;using Microsoft.Extensions.Logging;using Microsoft.Extensions.Logging.Abstractions;using OpenAI;using System.ClientModel;// SubagentsAgent — backs the /subagents demo.//// Mirrors langgraph-python/src/agents/subagents.py and// google-adk/src/agents/subagents_agent.py:////   * A supervisor ChatClientAgent exposes three tools — `research_agent`,//     `writing_agent`, `critique_agent` — each of which delegates to a//     specialised sub-agent.////   * Each sub-agent is implemented as a single-shot secondary chat-client//     call with its own system prompt. This is conceptually identical to//     spawning a separate ChatClientAgent + Runner per delegation; we use a//     single-shot call here to keep the demo wiring tight (and to mirror the//     google-adk reference, which does the same with `genai.Client`).////   * Every delegation is recorded in `state.delegations` — a list of//     `Delegation { id, sub_agent, task, status, result }` records — and//     emitted to the UI as a state-snapshot DataContent payload after the//     supervisor's stream completes. (The snapshot also gets re-emitted on//     each tool call so the UI's `running` -> `completed` transition is//     visible mid-stream; see `EmitSnapshotAsync` below.)[SuppressMessage("Performance", "CA1812:Avoid uninstantiated internal classes", Justification = "Instantiated by SubagentsAgentFactory")]internal sealed class SubagentsAgent : DelegatingAIAgent{    private readonly ILogger<SubagentsAgent> _logger;    private readonly SubagentsStore _store;    public SubagentsAgent(        AIAgent innerAgent,        SubagentsStore store,        ILogger<SubagentsAgent>? logger = null)        : base(innerAgent)    {        ArgumentNullException.ThrowIfNull(innerAgent);        ArgumentNullException.ThrowIfNull(store);        _store = store;        _logger = logger ?? NullLogger<SubagentsAgent>.Instance;    }    public override Task<AgentRunResponse> RunAsync(IEnumerable<ChatMessage> messages, AgentThread? thread = null, AgentRunOptions? options = null, CancellationToken cancellationToken = default)    {        return RunStreamingAsync(messages, thread, options, cancellationToken).ToAgentRunResponseAsync(cancellationToken);    }    public override async IAsyncEnumerable<AgentRunResponseUpdate> RunStreamingAsync(        IEnumerable<ChatMessage> messages,        AgentThread? thread = null,        AgentRunOptions? options = null,        [EnumeratorCancellation] CancellationToken cancellationToken = default)    {        ArgumentNullException.ThrowIfNull(messages);        var messageList = messages as IReadOnlyList<ChatMessage> ?? messages.ToList();        // Bind the tool's read/write target to the current thread so each        // conversation appends to its own delegation list. The store        // exposes a per-thread "active" handle that the static tool        // function reads. We restore the previous value on exit so nested /        // overlapping runs don't trample each other.        var previous = (AgentThread?)_store.SetActiveThread(thread);        try        {            await foreach (var update in InnerAgent.RunStreamingAsync(messageList, thread, options, cancellationToken).ConfigureAwait(false))            {                yield return update;                // Flush any state changes the tool made during this update                // chunk. The inner ChatClientAgent doesn't emit DataContent                // for tool calls, so the UI would otherwise only see the                // final post-stream snapshot — losing the visible                // running -> completed transition that makes the demo                // compelling. We dedupe via SubagentsStore.TakeDirtyVersion                // so we don't spam identical snapshots across token chunks.                if (_store.TakeDirty(thread))                {                    var snapshot = _store.BuildSnapshot(thread);                    var bytes = JsonSerializer.SerializeToUtf8Bytes(                        snapshot,                        SubagentsSerializerContext.Default.SubagentsSnapshot);                    yield return new AgentRunResponseUpdate                    {                        Contents = [new DataContent(bytes, "application/json")],                    };                }            }        }        finally        {            _store.SetActiveThread(previous);        }        // Final snapshot — guarantees at least one state event per turn        // even if the supervisor produced no tool calls (so the UI sees a        // stable empty `delegations` list rather than `undefined`).        var finalSnapshot = _store.BuildSnapshot(thread);        var finalBytes = JsonSerializer.SerializeToUtf8Bytes(            finalSnapshot,            SubagentsSerializerContext.Default.SubagentsSnapshot);        yield return new AgentRunResponseUpdate        {            Contents = [new DataContent(finalBytes, "application/json")],        };    }}/// <summary>/// Per-thread store of delegation entries. Reads/writes are synchronized via/// a single lock — the demo workload is light and the lock is held only/// across the read-modify-write of an in-memory list./// </summary>internal sealed class SubagentsStore{    // Instance-scoped (not static) so multiple SubagentsStore instances —    // e.g. test helpers, future multi-tenant wiring — don't share global    // state with their per-instance `_slots` dict.    private readonly object _globalSlot = new();    private readonly AsyncLocal<object?> _activeThreadKey = new();    private readonly Dictionary<object, ThreadSlot> _slots = new();    private readonly object _lock = new();    public object? SetActiveThread(AgentThread? thread)    {        var prior = _activeThreadKey.Value;        _activeThreadKey.Value = thread ?? _globalSlot;        return prior;    }    public string AppendRunning(string subAgent, string task)    {        var entry = new SubagentDelegation(            Id: Guid.NewGuid().ToString("n")[..16],            SubAgent: subAgent,            Task: task,            Status: "running",            Result: "");        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            slot.Delegations.Add(entry);            slot.DirtyVersion++;        }        return entry.Id;    }    public void Update(string id, string status, string result)    {        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            for (var i = 0; i < slot.Delegations.Count; i++)            {                if (slot.Delegations[i].Id == id)                {                    slot.Delegations[i] = slot.Delegations[i] with                    {                        Status = status,                        Result = result,                    };                    slot.DirtyVersion++;                    return;                }            }        }    }    public bool TakeDirty(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return false;            }            if (slot.DirtyVersion == slot.LastEmittedVersion)            {                return false;            }            slot.LastEmittedVersion = slot.DirtyVersion;            return true;        }    }    public SubagentsSnapshot BuildSnapshot(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return new SubagentsSnapshot(Array.Empty<SubagentDelegation>());            }            // Defensive copy — caller may serialize after the lock releases.            return new SubagentsSnapshot(slot.Delegations.ToArray());        }    }    private ThreadSlot GetOrCreateSlot(object key)    {        if (!_slots.TryGetValue(key, out var slot))        {            slot = new ThreadSlot();            _slots[key] = slot;        }        return slot;    }    private sealed class ThreadSlot    {        public List<SubagentDelegation> Delegations { get; } = new();        public long DirtyVersion { get; set; }        public long LastEmittedVersion { get; set; }    }}internal sealed record SubagentDelegation(    [property: JsonPropertyName("id")] string Id,    [property: JsonPropertyName("sub_agent")] string SubAgent,    [property: JsonPropertyName("task")] string Task,    [property: JsonPropertyName("status")] string Status,    [property: JsonPropertyName("result")] string Result);internal sealed record SubagentsSnapshot(    [property: JsonPropertyName("delegations")] IReadOnlyList<SubagentDelegation> Delegations);[JsonSerializable(typeof(SubagentsSnapshot))][JsonSerializable(typeof(SubagentDelegation))][JsonSerializable(typeof(IReadOnlyList<SubagentDelegation>))]internal sealed partial class SubagentsSerializerContext : JsonSerializerContext;/// <summary>/// Factory that builds the supervisor agent + the three sub-agent tools./// Mounted in Program.cs at `/subagents`./// </summary>public sealed class SubagentsAgentFactory{    private const string DefaultOpenAiEndpoint = "https://models.inference.ai.azure.com";    private const string SubAgentModel = "gpt-4o-mini";    // Each sub-agent is a single-shot ChatClient call (built per-delegation    // in DelegateAsync) with its own system prompt. They don't share memory    // or tools with the supervisor — the supervisor only sees their return    // value as a tool result.    private const string ResearchSystemPrompt =        "You are a research sub-agent. Given a topic, produce a concise " +        "bulleted list of 3-5 key facts. No preamble, no closing.";    private const string WritingSystemPrompt =        "You are a writing sub-agent. Given a brief and optional source facts, " +        "produce a polished 1-paragraph draft. Be clear and concrete. No preamble.";    private const string CritiqueSystemPrompt =        "You are an editorial critique sub-agent. Given a draft, give 2-3 crisp, " +        "actionable critiques. No preamble.";    private const string SupervisorPrompt =        "You are a supervisor agent that coordinates three specialized " +        "sub-agents to produce high-quality deliverables.\n\n" +        "Available sub-agents (call them as tools):\n" +        "  - research_agent: gathers facts on a topic.\n" +        "  - writing_agent: turns facts + a brief into a polished draft.\n" +        "  - critique_agent: reviews a draft and suggests improvements.\n\n" +        "For most non-trivial user requests, delegate in sequence: research -> " +        "write -> critique. Pass relevant facts/draft through the `task` argument " +        "of each tool. Each tool returns a JSON object shaped " +        "{status: 'completed' | 'failed', result?: string, error?: string}. " +        "If a sub-agent fails, surface the failure briefly to the user (don't " +        "fabricate a result) and decide whether to retry. Keep your own " +        "messages short — explain the plan once, delegate, then return a " +        "concise summary once done. The UI shows the user a live log of " +        "every sub-agent delegation, including the in-flight 'running' state.";    private readonly OpenAIClient _openAiClient;    private readonly ILoggerFactory _loggerFactory;    private readonly ILogger _logger;    private readonly JsonSerializerOptions _jsonSerializerOptions;    private readonly SubagentsStore _store = new();    public SubagentsAgentFactory(        IConfiguration configuration,        ILoggerFactory loggerFactory,        JsonSerializerOptions jsonSerializerOptions)    {        ArgumentNullException.ThrowIfNull(configuration);        ArgumentNullException.ThrowIfNull(loggerFactory);        ArgumentNullException.ThrowIfNull(jsonSerializerOptions);        _loggerFactory = loggerFactory;        _logger = loggerFactory.CreateLogger<SubagentsAgentFactory>();        _jsonSerializerOptions = jsonSerializerOptions;        var githubToken = configuration["GitHubToken"]            ?? throw new InvalidOperationException(                "GitHubToken not found in configuration. " +                "Please set it using: dotnet user-secrets set GitHubToken \"<your-token>\" " +                "or get it using: gh auth token");        var endpoint = Environment.GetEnvironmentVariable("OPENAI_BASE_URL") ?? DefaultOpenAiEndpoint;        _openAiClient = new(            new ApiKeyCredential(githubToken),            AimockHeaderPolicy.CreateOpenAIClientOptions(endpoint));    }    public AIAgent CreateAgent()    {        var chatClient = _openAiClient.GetChatClient("gpt-4o-mini").AsIChatClient();        // Each sub-agent is exposed to the supervisor LLM as an AIFunction        // tool. When the supervisor invokes one, DelegateAsync runs a fresh        // ChatClient call with that sub-agent's system prompt, appends a        // Delegation entry to shared state, and returns the sub-agent's        // output to the supervisor as a tool result.        var research = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("research_agent", ResearchSystemPrompt, task, ct)),            options: new()            {                Name = "research_agent",                Description = "Delegate a research task to the research sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });        var writing = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("writing_agent", WritingSystemPrompt, task, ct)),            options: new()            {                Name = "writing_agent",                Description = "Delegate a drafting task to the writing sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });        var critique = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("critique_agent", CritiqueSystemPrompt, task, ct)),            options: new()            {                Name = "critique_agent",                Description = "Delegate a critique task to the critique sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });        var inner = new ChatClientAgent(            chatClient,            name: "SubagentsSupervisor",            description: SupervisorPrompt,            tools: [research, writing, critique]);        return new SubagentsAgent(inner, _store, _loggerFactory.CreateLogger<SubagentsAgent>());    }    /// <summary>    /// Common delegation flow — append a "running" entry, invoke a single-    /// shot secondary chat-client call, then update the entry to    /// "completed" / "failed". Returns a JSON string the supervisor LLM    /// reads as the tool result, mirroring the dict shape used by the    /// google-adk reference.    /// </summary>    private async Task<string> DelegateAsync(        string subAgent,        string systemPrompt,        string task,        CancellationToken cancellationToken)    {        ArgumentNullException.ThrowIfNull(task);        var entryId = _store.AppendRunning(subAgent, task);        _logger.LogInformation("subagent: starting {SubAgent} (entryId={EntryId}) task={TaskLength} chars", subAgent, entryId, task.Length);        try        {            var secondary = _openAiClient.GetChatClient(SubAgentModel).AsIChatClient();            var messages = new List<ChatMessage>            {                new(ChatRole.System, systemPrompt),                new(ChatRole.User, task),            };            var response = await secondary.GetResponseAsync(messages, cancellationToken: cancellationToken).ConfigureAwait(false);            var text = response.Text?.Trim() ?? "";            if (string.IsNullOrEmpty(text))            {                _logger.LogWarning("subagent: {SubAgent} returned no text content", subAgent);                _store.Update(entryId, "failed", "sub-agent returned empty text");                return JsonSerializer.Serialize(new { status = "failed", error = "sub-agent returned empty text" });            }            _store.Update(entryId, "completed", text);            return JsonSerializer.Serialize(new { status = "completed", result = text });        }        catch (HttpRequestException ex)        {            _logger.LogError(ex, "subagent: {SubAgent} transport failure", subAgent);            var msg = $"sub-agent call failed: {ex.GetType().Name} (see server logs)";            _store.Update(entryId, "failed", msg);            return JsonSerializer.Serialize(new { status = "failed", error = msg });        }        catch (ClientResultException ex)        {            _logger.LogError(ex, "subagent: {SubAgent} upstream returned status {Status}", subAgent, ex.Status);            var msg = $"sub-agent call failed: upstream returned error status {ex.Status}";            _store.Update(entryId, "failed", msg);            return JsonSerializer.Serialize(new { status = "failed", error = msg });        }        catch (OperationCanceledException)        {            _store.Update(entryId, "failed", "sub-agent call cancelled");            throw;        }    }}

What is this?#

Sub-agents are the canonical multi-agent pattern: a top-level supervisor LLM orchestrates one or more specialized sub-agents by exposing each of them as a tool. The supervisor decides what to delegate, the sub-agents do their narrow job, and their results flow back up to the supervisor's next step.

This is fundamentally the same shape as tool-calling, but each "tool" is itself a full-blown agent with its own system prompt and (often) its own tools, memory, and model.

When should I use this?#

Reach for sub-agents when a task has distinct specialized sub-tasks that each benefit from their own focus:

Research → Write → Critique pipelines, where each stage needs a different system prompt and temperature.
Router + specialists, where one agent classifies the request and dispatches to the right expert.
Divide-and-conquer — any problem that fits cleanly into parallel or sequential sub-problems.

The example below uses the Research → Write → Critique shape as the canonical example.

Setting up sub-agents#

Each sub-agent is a full create_agent(...) call with its own model, its own system prompt, and (optionally) its own tools. They don't share memory or tools with the supervisor; the supervisor only ever sees what the sub-agent returns.

SubagentsAgent.cs

using System.ComponentModel;using System.Diagnostics.CodeAnalysis;using System.Net.Http;using System.Runtime.CompilerServices;using System.Text.Json;using System.Text.Json.Serialization;using Microsoft.Agents.AI;using Microsoft.Extensions.AI;using Microsoft.Extensions.Logging;using Microsoft.Extensions.Logging.Abstractions;using OpenAI;using System.ClientModel;// SubagentsAgent — backs the /subagents demo.//// Mirrors langgraph-python/src/agents/subagents.py and// google-adk/src/agents/subagents_agent.py:////   * A supervisor ChatClientAgent exposes three tools — `research_agent`,//     `writing_agent`, `critique_agent` — each of which delegates to a//     specialised sub-agent.////   * Each sub-agent is implemented as a single-shot secondary chat-client//     call with its own system prompt. This is conceptually identical to//     spawning a separate ChatClientAgent + Runner per delegation; we use a//     single-shot call here to keep the demo wiring tight (and to mirror the//     google-adk reference, which does the same with `genai.Client`).////   * Every delegation is recorded in `state.delegations` — a list of//     `Delegation { id, sub_agent, task, status, result }` records — and//     emitted to the UI as a state-snapshot DataContent payload after the//     supervisor's stream completes. (The snapshot also gets re-emitted on//     each tool call so the UI's `running` -> `completed` transition is//     visible mid-stream; see `EmitSnapshotAsync` below.)[SuppressMessage("Performance", "CA1812:Avoid uninstantiated internal classes", Justification = "Instantiated by SubagentsAgentFactory")]internal sealed class SubagentsAgent : DelegatingAIAgent{    private readonly ILogger<SubagentsAgent> _logger;    private readonly SubagentsStore _store;    public SubagentsAgent(        AIAgent innerAgent,        SubagentsStore store,        ILogger<SubagentsAgent>? logger = null)        : base(innerAgent)    {        ArgumentNullException.ThrowIfNull(innerAgent);        ArgumentNullException.ThrowIfNull(store);        _store = store;        _logger = logger ?? NullLogger<SubagentsAgent>.Instance;    }    public override Task<AgentRunResponse> RunAsync(IEnumerable<ChatMessage> messages, AgentThread? thread = null, AgentRunOptions? options = null, CancellationToken cancellationToken = default)    {        return RunStreamingAsync(messages, thread, options, cancellationToken).ToAgentRunResponseAsync(cancellationToken);    }    public override async IAsyncEnumerable<AgentRunResponseUpdate> RunStreamingAsync(        IEnumerable<ChatMessage> messages,        AgentThread? thread = null,        AgentRunOptions? options = null,        [EnumeratorCancellation] CancellationToken cancellationToken = default)    {        ArgumentNullException.ThrowIfNull(messages);        var messageList = messages as IReadOnlyList<ChatMessage> ?? messages.ToList();        // Bind the tool's read/write target to the current thread so each        // conversation appends to its own delegation list. The store        // exposes a per-thread "active" handle that the static tool        // function reads. We restore the previous value on exit so nested /        // overlapping runs don't trample each other.        var previous = (AgentThread?)_store.SetActiveThread(thread);        try        {            await foreach (var update in InnerAgent.RunStreamingAsync(messageList, thread, options, cancellationToken).ConfigureAwait(false))            {                yield return update;                // Flush any state changes the tool made during this update                // chunk. The inner ChatClientAgent doesn't emit DataContent                // for tool calls, so the UI would otherwise only see the                // final post-stream snapshot — losing the visible                // running -> completed transition that makes the demo                // compelling. We dedupe via SubagentsStore.TakeDirtyVersion                // so we don't spam identical snapshots across token chunks.                if (_store.TakeDirty(thread))                {                    var snapshot = _store.BuildSnapshot(thread);                    var bytes = JsonSerializer.SerializeToUtf8Bytes(                        snapshot,                        SubagentsSerializerContext.Default.SubagentsSnapshot);                    yield return new AgentRunResponseUpdate                    {                        Contents = [new DataContent(bytes, "application/json")],                    };                }            }        }        finally        {            _store.SetActiveThread(previous);        }        // Final snapshot — guarantees at least one state event per turn        // even if the supervisor produced no tool calls (so the UI sees a        // stable empty `delegations` list rather than `undefined`).        var finalSnapshot = _store.BuildSnapshot(thread);        var finalBytes = JsonSerializer.SerializeToUtf8Bytes(            finalSnapshot,            SubagentsSerializerContext.Default.SubagentsSnapshot);        yield return new AgentRunResponseUpdate        {            Contents = [new DataContent(finalBytes, "application/json")],        };    }}/// <summary>/// Per-thread store of delegation entries. Reads/writes are synchronized via/// a single lock — the demo workload is light and the lock is held only/// across the read-modify-write of an in-memory list./// </summary>internal sealed class SubagentsStore{    // Instance-scoped (not static) so multiple SubagentsStore instances —    // e.g. test helpers, future multi-tenant wiring — don't share global    // state with their per-instance `_slots` dict.    private readonly object _globalSlot = new();    private readonly AsyncLocal<object?> _activeThreadKey = new();    private readonly Dictionary<object, ThreadSlot> _slots = new();    private readonly object _lock = new();    public object? SetActiveThread(AgentThread? thread)    {        var prior = _activeThreadKey.Value;        _activeThreadKey.Value = thread ?? _globalSlot;        return prior;    }    public string AppendRunning(string subAgent, string task)    {        var entry = new SubagentDelegation(            Id: Guid.NewGuid().ToString("n")[..16],            SubAgent: subAgent,            Task: task,            Status: "running",            Result: "");        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            slot.Delegations.Add(entry);            slot.DirtyVersion++;        }        return entry.Id;    }    public void Update(string id, string status, string result)    {        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            for (var i = 0; i < slot.Delegations.Count; i++)            {                if (slot.Delegations[i].Id == id)                {                    slot.Delegations[i] = slot.Delegations[i] with                    {                        Status = status,                        Result = result,                    };                    slot.DirtyVersion++;                    return;                }            }        }    }    public bool TakeDirty(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return false;            }            if (slot.DirtyVersion == slot.LastEmittedVersion)            {                return false;            }            slot.LastEmittedVersion = slot.DirtyVersion;            return true;        }    }    public SubagentsSnapshot BuildSnapshot(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return new SubagentsSnapshot(Array.Empty<SubagentDelegation>());            }            // Defensive copy — caller may serialize after the lock releases.            return new SubagentsSnapshot(slot.Delegations.ToArray());        }    }    private ThreadSlot GetOrCreateSlot(object key)    {        if (!_slots.TryGetValue(key, out var slot))        {            slot = new ThreadSlot();            _slots[key] = slot;        }        return slot;    }    private sealed class ThreadSlot    {        public List<SubagentDelegation> Delegations { get; } = new();        public long DirtyVersion { get; set; }        public long LastEmittedVersion { get; set; }    }}internal sealed record SubagentDelegation(    [property: JsonPropertyName("id")] string Id,    [property: JsonPropertyName("sub_agent")] string SubAgent,    [property: JsonPropertyName("task")] string Task,    [property: JsonPropertyName("status")] string Status,    [property: JsonPropertyName("result")] string Result);internal sealed record SubagentsSnapshot(    [property: JsonPropertyName("delegations")] IReadOnlyList<SubagentDelegation> Delegations);[JsonSerializable(typeof(SubagentsSnapshot))][JsonSerializable(typeof(SubagentDelegation))][JsonSerializable(typeof(IReadOnlyList<SubagentDelegation>))]internal sealed partial class SubagentsSerializerContext : JsonSerializerContext;/// <summary>/// Factory that builds the supervisor agent + the three sub-agent tools./// Mounted in Program.cs at `/subagents`./// </summary>public sealed class SubagentsAgentFactory{    private const string DefaultOpenAiEndpoint = "https://models.inference.ai.azure.com";    private const string SubAgentModel = "gpt-4o-mini";    // Each sub-agent is a single-shot ChatClient call (built per-delegation    // in DelegateAsync) with its own system prompt. They don't share memory    // or tools with the supervisor — the supervisor only sees their return    // value as a tool result.    private const string ResearchSystemPrompt =        "You are a research sub-agent. Given a topic, produce a concise " +        "bulleted list of 3-5 key facts. No preamble, no closing.";    private const string WritingSystemPrompt =        "You are a writing sub-agent. Given a brief and optional source facts, " +        "produce a polished 1-paragraph draft. Be clear and concrete. No preamble.";    private const string CritiqueSystemPrompt =        "You are an editorial critique sub-agent. Given a draft, give 2-3 crisp, " +        "actionable critiques. No preamble.";

Keep sub-agent system prompts narrow and focused. The point of this pattern is that each one does one thing well. If a sub-agent needs to know the whole user context to do its job, that's a signal the boundary is wrong.

Exposing sub-agents as tools#

The supervisor delegates by calling tools. Each tool is a thin wrapper around sub_agent.invoke(...) that:

Runs the sub-agent synchronously on the supplied task string.
Records the delegation into a delegations slot in shared agent state (so the UI can render a live log).
Returns the sub-agent's final message as a ToolMessage, which the supervisor sees as a normal tool result on its next turn.

SubagentsAgent.cs

using System.ComponentModel;using System.Diagnostics.CodeAnalysis;using System.Net.Http;using System.Runtime.CompilerServices;using System.Text.Json;using System.Text.Json.Serialization;using Microsoft.Agents.AI;using Microsoft.Extensions.AI;using Microsoft.Extensions.Logging;using Microsoft.Extensions.Logging.Abstractions;using OpenAI;using System.ClientModel;// SubagentsAgent — backs the /subagents demo.//// Mirrors langgraph-python/src/agents/subagents.py and// google-adk/src/agents/subagents_agent.py:////   * A supervisor ChatClientAgent exposes three tools — `research_agent`,//     `writing_agent`, `critique_agent` — each of which delegates to a//     specialised sub-agent.////   * Each sub-agent is implemented as a single-shot secondary chat-client//     call with its own system prompt. This is conceptually identical to//     spawning a separate ChatClientAgent + Runner per delegation; we use a//     single-shot call here to keep the demo wiring tight (and to mirror the//     google-adk reference, which does the same with `genai.Client`).////   * Every delegation is recorded in `state.delegations` — a list of//     `Delegation { id, sub_agent, task, status, result }` records — and//     emitted to the UI as a state-snapshot DataContent payload after the//     supervisor's stream completes. (The snapshot also gets re-emitted on//     each tool call so the UI's `running` -> `completed` transition is//     visible mid-stream; see `EmitSnapshotAsync` below.)[SuppressMessage("Performance", "CA1812:Avoid uninstantiated internal classes", Justification = "Instantiated by SubagentsAgentFactory")]internal sealed class SubagentsAgent : DelegatingAIAgent{    private readonly ILogger<SubagentsAgent> _logger;    private readonly SubagentsStore _store;    public SubagentsAgent(        AIAgent innerAgent,        SubagentsStore store,        ILogger<SubagentsAgent>? logger = null)        : base(innerAgent)    {        ArgumentNullException.ThrowIfNull(innerAgent);        ArgumentNullException.ThrowIfNull(store);        _store = store;        _logger = logger ?? NullLogger<SubagentsAgent>.Instance;    }    public override Task<AgentRunResponse> RunAsync(IEnumerable<ChatMessage> messages, AgentThread? thread = null, AgentRunOptions? options = null, CancellationToken cancellationToken = default)    {        return RunStreamingAsync(messages, thread, options, cancellationToken).ToAgentRunResponseAsync(cancellationToken);    }    public override async IAsyncEnumerable<AgentRunResponseUpdate> RunStreamingAsync(        IEnumerable<ChatMessage> messages,        AgentThread? thread = null,        AgentRunOptions? options = null,        [EnumeratorCancellation] CancellationToken cancellationToken = default)    {        ArgumentNullException.ThrowIfNull(messages);        var messageList = messages as IReadOnlyList<ChatMessage> ?? messages.ToList();        // Bind the tool's read/write target to the current thread so each        // conversation appends to its own delegation list. The store        // exposes a per-thread "active" handle that the static tool        // function reads. We restore the previous value on exit so nested /        // overlapping runs don't trample each other.        var previous = (AgentThread?)_store.SetActiveThread(thread);        try        {            await foreach (var update in InnerAgent.RunStreamingAsync(messageList, thread, options, cancellationToken).ConfigureAwait(false))            {                yield return update;                // Flush any state changes the tool made during this update                // chunk. The inner ChatClientAgent doesn't emit DataContent                // for tool calls, so the UI would otherwise only see the                // final post-stream snapshot — losing the visible                // running -> completed transition that makes the demo                // compelling. We dedupe via SubagentsStore.TakeDirtyVersion                // so we don't spam identical snapshots across token chunks.                if (_store.TakeDirty(thread))                {                    var snapshot = _store.BuildSnapshot(thread);                    var bytes = JsonSerializer.SerializeToUtf8Bytes(                        snapshot,                        SubagentsSerializerContext.Default.SubagentsSnapshot);                    yield return new AgentRunResponseUpdate                    {                        Contents = [new DataContent(bytes, "application/json")],                    };                }            }        }        finally        {            _store.SetActiveThread(previous);        }        // Final snapshot — guarantees at least one state event per turn        // even if the supervisor produced no tool calls (so the UI sees a        // stable empty `delegations` list rather than `undefined`).        var finalSnapshot = _store.BuildSnapshot(thread);        var finalBytes = JsonSerializer.SerializeToUtf8Bytes(            finalSnapshot,            SubagentsSerializerContext.Default.SubagentsSnapshot);        yield return new AgentRunResponseUpdate        {            Contents = [new DataContent(finalBytes, "application/json")],        };    }}/// <summary>/// Per-thread store of delegation entries. Reads/writes are synchronized via/// a single lock — the demo workload is light and the lock is held only/// across the read-modify-write of an in-memory list./// </summary>internal sealed class SubagentsStore{    // Instance-scoped (not static) so multiple SubagentsStore instances —    // e.g. test helpers, future multi-tenant wiring — don't share global    // state with their per-instance `_slots` dict.    private readonly object _globalSlot = new();    private readonly AsyncLocal<object?> _activeThreadKey = new();    private readonly Dictionary<object, ThreadSlot> _slots = new();    private readonly object _lock = new();    public object? SetActiveThread(AgentThread? thread)    {        var prior = _activeThreadKey.Value;        _activeThreadKey.Value = thread ?? _globalSlot;        return prior;    }    public string AppendRunning(string subAgent, string task)    {        var entry = new SubagentDelegation(            Id: Guid.NewGuid().ToString("n")[..16],            SubAgent: subAgent,            Task: task,            Status: "running",            Result: "");        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            slot.Delegations.Add(entry);            slot.DirtyVersion++;        }        return entry.Id;    }    public void Update(string id, string status, string result)    {        lock (_lock)        {            var slot = GetOrCreateSlot(_activeThreadKey.Value ?? _globalSlot);            for (var i = 0; i < slot.Delegations.Count; i++)            {                if (slot.Delegations[i].Id == id)                {                    slot.Delegations[i] = slot.Delegations[i] with                    {                        Status = status,                        Result = result,                    };                    slot.DirtyVersion++;                    return;                }            }        }    }    public bool TakeDirty(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return false;            }            if (slot.DirtyVersion == slot.LastEmittedVersion)            {                return false;            }            slot.LastEmittedVersion = slot.DirtyVersion;            return true;        }    }    public SubagentsSnapshot BuildSnapshot(AgentThread? thread)    {        lock (_lock)        {            var key = (object?)thread ?? _globalSlot;            if (!_slots.TryGetValue(key, out var slot))            {                return new SubagentsSnapshot(Array.Empty<SubagentDelegation>());            }            // Defensive copy — caller may serialize after the lock releases.            return new SubagentsSnapshot(slot.Delegations.ToArray());        }    }    private ThreadSlot GetOrCreateSlot(object key)    {        if (!_slots.TryGetValue(key, out var slot))        {            slot = new ThreadSlot();            _slots[key] = slot;        }        return slot;    }    private sealed class ThreadSlot    {        public List<SubagentDelegation> Delegations { get; } = new();        public long DirtyVersion { get; set; }        public long LastEmittedVersion { get; set; }    }}internal sealed record SubagentDelegation(    [property: JsonPropertyName("id")] string Id,    [property: JsonPropertyName("sub_agent")] string SubAgent,    [property: JsonPropertyName("task")] string Task,    [property: JsonPropertyName("status")] string Status,    [property: JsonPropertyName("result")] string Result);internal sealed record SubagentsSnapshot(    [property: JsonPropertyName("delegations")] IReadOnlyList<SubagentDelegation> Delegations);[JsonSerializable(typeof(SubagentsSnapshot))][JsonSerializable(typeof(SubagentDelegation))][JsonSerializable(typeof(IReadOnlyList<SubagentDelegation>))]internal sealed partial class SubagentsSerializerContext : JsonSerializerContext;/// <summary>/// Factory that builds the supervisor agent + the three sub-agent tools./// Mounted in Program.cs at `/subagents`./// </summary>public sealed class SubagentsAgentFactory{    private const string DefaultOpenAiEndpoint = "https://models.inference.ai.azure.com";    private const string SubAgentModel = "gpt-4o-mini";    // Each sub-agent is a single-shot ChatClient call (built per-delegation    // in DelegateAsync) with its own system prompt. They don't share memory    // or tools with the supervisor — the supervisor only sees their return    // value as a tool result.    private const string ResearchSystemPrompt =        "You are a research sub-agent. Given a topic, produce a concise " +        "bulleted list of 3-5 key facts. No preamble, no closing.";    private const string WritingSystemPrompt =        "You are a writing sub-agent. Given a brief and optional source facts, " +        "produce a polished 1-paragraph draft. Be clear and concrete. No preamble.";    private const string CritiqueSystemPrompt =        "You are an editorial critique sub-agent. Given a draft, give 2-3 crisp, " +        "actionable critiques. No preamble.";    private const string SupervisorPrompt =        "You are a supervisor agent that coordinates three specialized " +        "sub-agents to produce high-quality deliverables.\n\n" +        "Available sub-agents (call them as tools):\n" +        "  - research_agent: gathers facts on a topic.\n" +        "  - writing_agent: turns facts + a brief into a polished draft.\n" +        "  - critique_agent: reviews a draft and suggests improvements.\n\n" +        "For most non-trivial user requests, delegate in sequence: research -> " +        "write -> critique. Pass relevant facts/draft through the `task` argument " +        "of each tool. Each tool returns a JSON object shaped " +        "{status: 'completed' | 'failed', result?: string, error?: string}. " +        "If a sub-agent fails, surface the failure briefly to the user (don't " +        "fabricate a result) and decide whether to retry. Keep your own " +        "messages short — explain the plan once, delegate, then return a " +        "concise summary once done. The UI shows the user a live log of " +        "every sub-agent delegation, including the in-flight 'running' state.";    private readonly OpenAIClient _openAiClient;    private readonly ILoggerFactory _loggerFactory;    private readonly ILogger _logger;    private readonly JsonSerializerOptions _jsonSerializerOptions;    private readonly SubagentsStore _store = new();    public SubagentsAgentFactory(        IConfiguration configuration,        ILoggerFactory loggerFactory,        JsonSerializerOptions jsonSerializerOptions)    {        ArgumentNullException.ThrowIfNull(configuration);        ArgumentNullException.ThrowIfNull(loggerFactory);        ArgumentNullException.ThrowIfNull(jsonSerializerOptions);        _loggerFactory = loggerFactory;        _logger = loggerFactory.CreateLogger<SubagentsAgentFactory>();        _jsonSerializerOptions = jsonSerializerOptions;        var githubToken = configuration["GitHubToken"]            ?? throw new InvalidOperationException(                "GitHubToken not found in configuration. " +                "Please set it using: dotnet user-secrets set GitHubToken \"<your-token>\" " +                "or get it using: gh auth token");        var endpoint = Environment.GetEnvironmentVariable("OPENAI_BASE_URL") ?? DefaultOpenAiEndpoint;        _openAiClient = new(            new ApiKeyCredential(githubToken),            AimockHeaderPolicy.CreateOpenAIClientOptions(endpoint));    }    public AIAgent CreateAgent()    {        var chatClient = _openAiClient.GetChatClient("gpt-4o-mini").AsIChatClient();        // Each sub-agent is exposed to the supervisor LLM as an AIFunction        // tool. When the supervisor invokes one, DelegateAsync runs a fresh        // ChatClient call with that sub-agent's system prompt, appends a        // Delegation entry to shared state, and returns the sub-agent's        // output to the supervisor as a tool result.        var research = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("research_agent", ResearchSystemPrompt, task, ct)),            options: new()            {                Name = "research_agent",                Description = "Delegate a research task to the research sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });        var writing = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("writing_agent", WritingSystemPrompt, task, ct)),            options: new()            {                Name = "writing_agent",                Description = "Delegate a drafting task to the writing sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });        var critique = AIFunctionFactory.Create(            (Func<string, CancellationToken, Task<string>>)((task, ct) =>                DelegateAsync("critique_agent", CritiqueSystemPrompt, task, ct)),            options: new()            {                Name = "critique_agent",                Description = "Delegate a critique task to the critique sub-agent. Returns JSON {status, result?, error?}.",                SerializerOptions = _jsonSerializerOptions,            });

This is where CopilotKit's shared-state channel earns its keep: the supervisor's tool calls mutate delegations as they happen, and the frontend renders every new entry live.

Rendering a live delegation log#

On the frontend, the delegation log is just a reactive render of the delegations slot. Subscribe with useAgent({ updates: [UseAgentUpdate.OnStateChanged, UseAgentUpdate.OnRunStatusChanged] }), read agent.state.delegations, and render one card per entry.

delegation-log.tsx

/** * Live delegation log — renders the `delegations` slot of agent state. * * Each entry corresponds to one invocation of a sub-agent. The list * grows in real time as the supervisor fans work out to its children. * The parent header shows how many sub-agents have been called and * whether the supervisor is still running. */// Fixed list of the three sub-agent roles the supervisor can call.// Rendered as always-visible indicator chips at the top of the log// (regardless of whether the supervisor has delegated yet) so the user// — and the e2e suite — can see at a glance which sub-agents exist and// which are currently active.const INDICATOR_ROLES: ReadonlyArray<{  role: "researcher" | "writer" | "critic";  subAgent: SubAgentName;}> = [  { role: "researcher", subAgent: "research_agent" },  { role: "writer", subAgent: "writing_agent" },  { role: "critic", subAgent: "critique_agent" },];export function DelegationLog({ delegations, isRunning }: DelegationLogProps) {  const calledRoles = new Set<SubAgentName>(    delegations.map((d) => d.sub_agent),  );  return (    <div      data-testid="delegation-log"      className="w-full h-full flex flex-col bg-white rounded-2xl shadow-sm border border-[#DBDBE5] overflow-hidden"    >      <div className="flex items-center justify-between px-6 py-3 border-b border-[#E9E9EF] bg-[#FAFAFC]">        <div className="flex items-center gap-3">          <span className="text-lg font-semibold text-[#010507]">            Sub-agent delegations          </span>          {isRunning && (            <span              data-testid="supervisor-running"              className="inline-flex items-center gap-1.5 px-2 py-0.5 rounded-full border border-[#BEC2FF] bg-[#BEC2FF1A] text-[#010507] text-[10px] font-semibold uppercase tracking-[0.12em]"            >              <span className="w-1.5 h-1.5 rounded-full bg-[#010507] animate-pulse" />              Supervisor running            </span>          )}        </div>        <span          data-testid="delegation-count"          className="text-xs font-mono text-[#838389]"        >          {delegations.length} calls        </span>      </div>      <div        data-testid="subagent-indicators"        className="flex items-center gap-2 border-b border-[#E9E9EF] bg-white px-6 py-2"      >        {INDICATOR_ROLES.map(({ role, subAgent }) => {          const style = SUB_AGENT_STYLE[subAgent];          const fired = calledRoles.has(subAgent);          return (            <span              key={role}              data-testid={`subagent-indicator-${role}`}              data-role={role}              data-fired={fired ? "true" : "false"}              className={`inline-flex items-center gap-1 px-2 py-0.5 rounded-full text-[10px] font-semibold uppercase tracking-[0.1em] border ${style.color} ${                fired ? "" : "opacity-60"              }`}            >              <span aria-hidden>{style.emoji}</span>              <span>{style.label}</span>            </span>          );        })}      </div>      <div className="flex-1 overflow-y-auto p-4 space-y-3">        {delegations.length === 0 ? (          <p className="text-[#838389] italic text-sm">            Ask the supervisor to complete a task. Every sub-agent it calls will            appear here.          </p>        ) : (          delegations.map((d, idx) => {            const style = SUB_AGENT_STYLE[d.sub_agent];            return (              <div                key={d.id}                data-testid="delegation-entry"                className="border border-[#E9E9EF] rounded-xl p-3 bg-[#FAFAFC]"              >                <div className="flex items-center justify-between mb-2">                  <div className="flex items-center gap-2">                    <span className="text-xs font-mono text-[#AFAFB7]">                      #{idx + 1}                    </span>                    <span                      className={`inline-flex items-center gap-1 px-2 py-0.5 rounded-full text-[10px] font-semibold uppercase tracking-[0.1em] border ${style.color}`}                    >                      <span>{style.emoji}</span>                      <span>{style.label}</span>                    </span>                  </div>                  <span className="text-[10px] uppercase tracking-[0.12em] font-semibold text-[#189370]">                    {d.status}                  </span>                </div>                <div className="text-xs text-[#57575B] mb-2">                  <span className="font-semibold text-[#010507]">Task: </span>                  {d.task}                </div>                <div className="text-sm text-[#010507] whitespace-pre-wrap bg-white rounded-lg p-2.5 border border-[#E9E9EF]">                  {d.result}                </div>              </div>            );          })        )}      </div>    </div>  );}

The result: as the supervisor fans work out to its sub-agents, the log grows in real time, giving the user visibility into a process that would otherwise be a long opaque spinner.

Shared State — the channel that makes the delegation log live.
State streaming — stream individual sub-agent outputs token-by-token inside each log entry.