-
Notifications
You must be signed in to change notification settings - Fork 411
Expand file tree
/
Copy pathcompose.yaml
More file actions
73 lines (67 loc) · 2.13 KB
/
compose.yaml
File metadata and controls
73 lines (67 loc) · 2.13 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
services:
agents:
image: demo/agents
build:
context: agent
ports:
- 7777:7777
environment:
# point agents at the MCP gateway
- MCPGATEWAY_URL=http://mcp-gateway:8811
depends_on:
- mcp-gateway
volumes:
# mount the agents file
- ./agents.yaml:/agents.yaml
models:
qwen3-small:
endpoint_var: MODEL_RUNNER_URL
model_var: MODEL_RUNNER_MODEL
agents-ui:
image: demo/ui
build:
context: agent-ui
ports:
- 3000:3000
environment:
- AGENTS_URL=http://localhost:7777
depends_on:
- agents
mcp-gateway:
# mcp-gateway secures your MCP servers
image: docker/mcp-gateway:latest
# use docker API socket to start MCP servers
use_api_socket: true
command:
- --transport=streaming
# securely embed secrets into the gateway
- --secrets=docker-desktop:/run/secrets/mcp_secret
# add any MCP servers you want to use
- --servers=github-official
# add an interceptor to format and simplify the output of the GitHub issues tool
# this interceptor will convert the JSON output of the tool into a CSV format
secrets:
- mcp_secret
models:
qwen3-small:
# pre-pull the model when starting Docker Model Runner
# model: ai/qwen3:30B-A3B-Q4_K_M
model: ai/qwen3:8B-Q4_0 # 4.44 GB
context_size: 15000 # 7 GB VRAM
# increase context size to handle larger results
# context_size: 41000 # 13 GB VRAM
qwen3-medium:
model: ai/qwen3:14B-Q6_K # 11.28 GB
context_size: 15000 # 15 GB VRAM
# increase context size to handle larger results
# context_size: 41000 # 21 GB VRAM
# The qwen3-large model is defined in compose.offload.yaml
# because it requires more resources and is intended to run with Docker Offload.
# A recommended practice with Docker Compose is to isolate specialized configurations
# in override files. These files modify the base setup when applied,
# in our case:
# docker compose -f compose.yaml -f compose.offload.yaml up --build
# mount the secrets file for MCP servers
secrets:
mcp_secret:
file: ./.mcp.env