Commit b27e9d2

Merge pull request #2510 from dgageot/board/add-docker-agent-serve-chat-command-0b138539
feat: add `docker agent serve chat` command (OpenAI-compatible API)
2 parents: 2cda184 + 0e1c5a8

20 files changed

Lines changed: 2995 additions & 3 deletions

.dockerignore

Lines changed: 1 addition & 0 deletions
@@ -7,5 +7,6 @@
 !./**/*.css
 !./**/*.go
 !./**/*.txt
+!/pkg/chatserver/openapi.json
 !/pkg/config/builtin-agents/*.yaml
 !/pkg/tui/styles/themes/*.yaml

cmd/root/chat.go

Lines changed: 98 additions & 0 deletions
@@ -0,0 +1,98 @@
package root

import (
	"os"
	"time"

	"github.com/spf13/cobra"

	"github.com/docker/docker-agent/pkg/chatserver"
	"github.com/docker/docker-agent/pkg/cli"
	"github.com/docker/docker-agent/pkg/config"
	"github.com/docker/docker-agent/pkg/telemetry"
)

type chatFlags struct {
	agentName             string
	listenAddr            string
	corsOrigin            string
	apiKey                string
	apiKeyEnv             string
	maxRequestSize        int64
	requestTimeout        time.Duration
	conversationsMaxItems int
	conversationTTL       time.Duration
	maxIdleRuntimes       int
	runConfig             config.RuntimeConfig
}

func newChatCmd() *cobra.Command {
	var flags chatFlags

	cmd := &cobra.Command{
		Use:   "chat <agent-file>|<registry-ref>",
		Short: "Start an agent as an OpenAI-compatible chat completions server",
		Long: `Start an HTTP server that exposes the agent through an OpenAI-compatible
API at /v1/chat/completions and /v1/models. This lets tools that already
speak OpenAI's chat protocol (such as Open WebUI) drive a docker-agent
agent without any custom integration.`,
		Example: `  docker-agent serve chat ./agent.yaml
  docker-agent serve chat ./team.yaml --agent reviewer
  docker-agent serve chat agentcatalog/pirate --listen 127.0.0.1:9090`,
		Args: cobra.ExactArgs(1),
		RunE: flags.runChatCommand,
	}

	cmd.Flags().StringVarP(&flags.agentName, "agent", "a", "", "Name of the agent to expose (all agents if not specified)")
	cmd.Flags().StringVarP(&flags.listenAddr, "listen", "l", "127.0.0.1:8083", "Address to listen on")
	cmd.Flags().StringVar(&flags.corsOrigin, "cors-origin", "", "Allowed CORS origin (e.g. https://example.com); empty disables CORS entirely")
	cmd.Flags().StringVar(&flags.apiKey, "api-key", "", "Required Bearer token clients must present (Authorization: Bearer <token>); empty disables auth")
	cmd.Flags().StringVar(&flags.apiKeyEnv, "api-key-env", "", "Read the API key from this environment variable instead of the command line")
	cmd.Flags().Int64Var(&flags.maxRequestSize, "max-request-size", 1<<20, "Maximum request body size in bytes (default 1 MiB)")
	cmd.Flags().DurationVar(&flags.requestTimeout, "request-timeout", 5*time.Minute, "Per-request timeout (covers model + tool calls + streaming)")
	cmd.Flags().IntVar(&flags.conversationsMaxItems, "conversations-max", 0, "Cache up to N conversations server-side, keyed by X-Conversation-Id (0 disables; clients must resend full history)")
	cmd.Flags().DurationVar(&flags.conversationTTL, "conversation-ttl", 30*time.Minute, "Idle TTL after which a cached conversation is evicted")
	cmd.Flags().IntVar(&flags.maxIdleRuntimes, "max-idle-runtimes", 4, "Maximum number of idle runtimes pooled per agent (0 disables pooling)")
	addRuntimeConfigFlags(cmd, &flags.runConfig)

	return cmd
}

func (f *chatFlags) runChatCommand(cmd *cobra.Command, args []string) (commandErr error) {
	ctx := cmd.Context()
	telemetry.TrackCommand(ctx, "serve", append([]string{"chat"}, args...))
	defer func() { // do not inline this defer so that commandErr is not resolved early
		telemetry.TrackCommandError(ctx, "serve", append([]string{"chat"}, args...), commandErr)
	}()

	out := cli.NewPrinter(cmd.OutOrStdout())
	agentFilename := args[0]

	ln, cleanup, err := newListener(ctx, f.listenAddr)
	if err != nil {
		return err
	}
	defer cleanup()

	out.Println("Listening on", ln.Addr().String())
	out.Println("OpenAI-compatible chat completions endpoint: http://" + ln.Addr().String() + "/v1/chat/completions")

	apiKey := f.apiKey
	if f.apiKeyEnv != "" {
		if v := os.Getenv(f.apiKeyEnv); v != "" {
			apiKey = v
		}
	}

	return chatserver.Run(ctx, agentFilename, chatserver.Options{
		AgentName:                f.agentName,
		RunConfig:                &f.runConfig,
		CORSOrigin:               f.corsOrigin,
		APIKey:                   apiKey,
		MaxRequestBytes:          f.maxRequestSize,
		RequestTimeout:           f.requestTimeout,
		ConversationsMaxSessions: f.conversationsMaxItems,
		ConversationTTL:          f.conversationTTL,
		MaxIdleRuntimes:          f.maxIdleRuntimes,
	}, ln)
}
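
Not part of the diff: because the surface above is OpenAI's standard chat completions protocol, the server can be exercised with nothing but Go's standard library. A minimal sketch, assuming a server started with --api-key my-secret and a non-zero --conversations-max; the agent name, bearer token, and conversation id below are placeholders, and the response decoding assumes OpenAI's usual choices[0].message.content shape.

package main

import (
	"bytes"
	"encoding/json"
	"fmt"
	"log"
	"net/http"
)

func main() {
	// Standard OpenAI chat completions request body.
	body, err := json.Marshal(map[string]any{
		"model": "root", // placeholder agent name; list the real ones via GET /v1/models
		"messages": []map[string]string{
			{"role": "user", "content": "Hello!"},
		},
	})
	if err != nil {
		log.Fatal(err)
	}

	req, err := http.NewRequest(http.MethodPost, "http://127.0.0.1:8083/v1/chat/completions", bytes.NewReader(body))
	if err != nil {
		log.Fatal(err)
	}
	req.Header.Set("Content-Type", "application/json")
	req.Header.Set("Authorization", "Bearer my-secret")   // only needed when --api-key/--api-key-env is set
	req.Header.Set("X-Conversation-Id", "demo-session-1") // only meaningful when --conversations-max > 0

	resp, err := http.DefaultClient.Do(req)
	if err != nil {
		log.Fatal(err)
	}
	defer resp.Body.Close()

	// Decode only the field we need from the OpenAI-shaped response.
	var out struct {
		Choices []struct {
			Message struct {
				Content string `json:"content"`
			} `json:"message"`
		} `json:"choices"`
	}
	if err := json.NewDecoder(resp.Body).Decode(&out); err != nil {
		log.Fatal(err)
	}
	if len(out.Choices) > 0 {
		fmt.Println(out.Choices[0].Message.Content)
	}
}

Drop the Authorization header when no API key is configured; X-Conversation-Id is presumably ignored while --conversations-max is 0.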

cmd/root/serve.go

Lines changed: 2 additions & 1 deletion
@@ -13,8 +13,9 @@ func newServeCmd() *cobra.Command {
 
 	cmd.AddCommand(newA2ACmd())
 	cmd.AddCommand(newACPCmd())
-	cmd.AddCommand(newMCPCmd())
 	cmd.AddCommand(newAPICmd())
+	cmd.AddCommand(newChatCmd())
+	cmd.AddCommand(newMCPCmd())
 
 	return cmd
 }

e2e/binary/binary_test.go

Lines changed: 3 additions & 2 deletions
@@ -54,12 +54,13 @@ func TestAutoComplete(t *testing.T) {
 		res, err := Exec(binDir+"/docker-agent", "__complete", "serve", "")
 		require.NoError(t, err)
 		props := lines(res.Stdout)
-		require.Greater(t, len(props), 4)
+		require.Greater(t, len(props), 5)
 		require.Contains(t, props[0], "a2a")
 		require.Contains(t, props[0], "Start an agent as an A2A")
 		require.Contains(t, props[1], "acp")
 		require.Contains(t, props[2], "api")
-		require.Contains(t, props[3], "mcp")
+		require.Contains(t, props[3], "chat")
+		require.Contains(t, props[4], "mcp")
 	})
 
 	t.Run("cli plugin auto-complete docker agent", func(t *testing.T) {

examples/chat/main.go

Lines changed: 174 additions & 0 deletions
@@ -0,0 +1,174 @@
// A very, very basic chat client for `docker agent serve chat`.
//
// PR #2510 (`feat: add docker agent serve chat command`) exposes any
// docker-agent agent through an OpenAI-compatible HTTP server. The whole
// point of that feature is that any tool already speaking OpenAI's
// /v1/chat/completions protocol can drive a docker-agent agent without
// custom integration. This example demonstrates exactly that: it uses the
// official github.com/openai/openai-go SDK, only repointed at the local
// chat server, to run an interactive REPL against an agent.
//
// Prerequisites:
//
//	# Start an agent in chat mode (in another terminal):
//	./bin/docker-agent serve chat ./examples/42.yaml
//	# It listens on http://127.0.0.1:8083 by default.
//
// Then run this client:
//
//	go run ./examples/chat
//	# or, to pin a specific agent in a multi-agent team:
//	go run ./examples/chat -model root
//	# or, to point at a different server:
//	go run ./examples/chat -base http://127.0.0.1:9090/v1
//
// Type a message and press <Enter>. Type "exit" (or send EOF with ^D) to
// quit.
package main

import (
	"bufio"
	"context"
	"errors"
	"flag"
	"fmt"
	"io"
	"log"
	"os"
	"os/signal"
	"strings"
	"syscall"

	"github.com/openai/openai-go/v3"
	"github.com/openai/openai-go/v3/option"
)

func main() {
	baseURL := flag.String("base", "http://127.0.0.1:8083/v1", "Base URL of the docker-agent chat server")
	model := flag.String("model", "", "Agent name to talk to (defaults to the team's default agent)")
	stream := flag.Bool("stream", true, "Stream the agent's response token-by-token")
	flag.Parse()

	ctx, cancel := signal.NotifyContext(context.Background(), syscall.SIGINT, syscall.SIGTERM)
	err := run(ctx, *baseURL, *model, *stream)
	cancel()
	if err != nil && !errors.Is(err, context.Canceled) {
		log.Fatal(err)
	}
}

func run(ctx context.Context, baseURL, model string, stream bool) error {
	// The chat server doesn't validate API keys, but the OpenAI SDK
	// requires *some* string to be passed.
	client := openai.NewClient(
		option.WithBaseURL(baseURL),
		option.WithAPIKey("not-needed"),
	)

	// Ask the server which agents are exposed and pick a default model
	// when the user didn't pin one. This also doubles as a connectivity
	// check.
	if model == "" {
		picked, err := pickDefaultModel(ctx, &client)
		if err != nil {
			return fmt.Errorf("listing models: %w", err)
		}
		model = picked
	}
	fmt.Printf("Connected to %s — chatting with %q. Type \"exit\" to quit.\n", baseURL, model)

	// History keeps the conversation going across turns. The chat server
	// is stateless: it builds a fresh session per request from whatever
	// messages the client sends, so it's the client's job to remember.
	var history []openai.ChatCompletionMessageParamUnion

	in := bufio.NewScanner(os.Stdin)
	in.Buffer(make([]byte, 0, 64*1024), 1024*1024)
	for {
		fmt.Print("\n> ")
		if !in.Scan() {
			if err := in.Err(); err != nil {
				return err
			}
			fmt.Println()
			return nil // EOF
		}
		userInput := strings.TrimSpace(in.Text())
		if userInput == "" {
			continue
		}
		if userInput == "exit" || userInput == "quit" {
			return nil
		}

		history = append(history, openai.UserMessage(userInput))

		reply, err := chat(ctx, &client, model, history, stream)
		if err != nil {
			return err
		}
		history = append(history, openai.AssistantMessage(reply))
	}
}

// pickDefaultModel queries /v1/models and returns the first agent name
// the server advertises.
func pickDefaultModel(ctx context.Context, client *openai.Client) (string, error) {
	page, err := client.Models.List(ctx)
	if err != nil {
		return "", err
	}
	if len(page.Data) == 0 {
		return "", errors.New("server exposes no models")
	}
	return page.Data[0].ID, nil
}

// chat sends the conversation to the server, prints the assistant's reply
// to stdout (streaming if requested) and returns the final assembled
// content so the caller can append it to the history.
func chat(
	ctx context.Context,
	client *openai.Client,
	model string,
	history []openai.ChatCompletionMessageParamUnion,
	stream bool,
) (string, error) {
	params := openai.ChatCompletionNewParams{
		Model:    model,
		Messages: history,
	}

	if !stream {
		resp, err := client.Chat.Completions.New(ctx, params)
		if err != nil {
			return "", err
		}
		if len(resp.Choices) == 0 {
			return "", errors.New("server returned no choices")
		}
		content := resp.Choices[0].Message.Content
		fmt.Println(content)
		return content, nil
	}

	s := client.Chat.Completions.NewStreaming(ctx, params)
	var b strings.Builder
	for s.Next() {
		chunk := s.Current()
		if len(chunk.Choices) == 0 {
			continue
		}
		delta := chunk.Choices[0].Delta.Content
		if delta == "" {
			continue
		}
		fmt.Print(delta)
		b.WriteString(delta)
	}
	if err := s.Err(); err != nil && !errors.Is(err, io.EOF) {
		return "", err
	}
	fmt.Println()
	return b.String(), nil
}
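
The REPL above resends the full history on every turn, which is what the server's default stateless mode requires. When the server instead runs with --conversations-max greater than zero, conversations are cached server-side, keyed by the X-Conversation-Id header (per the flag help in cmd/root/chat.go). Below is a hedged sketch of a helper that could sit alongside chat() in this file; it assumes the cache lets clients send only the newest message, which is inferred from the flag description rather than shown in this diff, and it relies on the SDK's generic option.WithHeader request option.

// chatCached is a speculative variant of chat() for servers started with
// --conversations-max > 0. The server caches conversations keyed by the
// X-Conversation-Id header, so this sends only the newest user message
// instead of the whole history (behaviour inferred from the flag help;
// adjust if the server still expects the full history).
func chatCached(ctx context.Context, client *openai.Client, model, conversationID, userInput string) (string, error) {
	resp, err := client.Chat.Completions.New(ctx,
		openai.ChatCompletionNewParams{
			Model:    model,
			Messages: []openai.ChatCompletionMessageParamUnion{openai.UserMessage(userInput)},
		},
		option.WithHeader("X-Conversation-Id", conversationID),
	)
	if err != nil {
		return "", err
	}
	if len(resp.Choices) == 0 {
		return "", errors.New("server returned no choices")
	}
	return resp.Choices[0].Message.Content, nil
}

Each distinct conversationID then gets its own cached session until the --conversation-ttl idle timeout evicts it.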
