8 changes: 4 additions & 4 deletions docs/README.md
@@ -60,8 +60,8 @@ graph TB
end

subgraph LLM["LLM Layer"]
Client["LiteLLM Client"]
Provider["Provider (Chutes/OpenRouter)"]
Client["LLM Client"]
Provider["Chutes API"]
end

subgraph Tools["Tool System"]
@@ -91,7 +91,7 @@ graph TB
- **Prompt Caching** - 90%+ cache hit rate for significant cost reduction
- **Context Management** - Intelligent pruning and compaction for long tasks
- **Self-Verification** - Automatic validation before task completion
-- **Multi-Provider** - Supports Chutes AI, OpenRouter, and litellm-compatible providers
+- **Chutes API** - Uses Chutes AI with OpenAI-compatible API format
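
For reference, the replacement bullet implies a plain OpenAI-compatible HTTP call. A minimal sketch with httpx follows; the base URL, env var name, and model id are assumptions for illustration, not values taken from this diff:

```python
# Minimal OpenAI-compatible chat completion call, as the feature bullet
# describes. CHUTES_BASE_URL, CHUTES_API_KEY, and the model id are
# placeholders, not values from this repository.
import os

import httpx

CHUTES_BASE_URL = "https://llm.chutes.ai/v1"  # assumed endpoint
api_key = os.environ["CHUTES_API_KEY"]        # assumed env var name

resp = httpx.post(
    f"{CHUTES_BASE_URL}/chat/completions",
    headers={"Authorization": f"Bearer {api_key}"},
    json={
        "model": "deepseek-ai/DeepSeek-V3",  # placeholder model id
        "messages": [{"role": "user", "content": "Create hello.txt"}],
        "temperature": 0.0,
        "max_tokens": 256,
    },
    timeout=60.0,
)
resp.raise_for_status()
print(resp.json()["choices"][0]["message"]["content"])
```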

---

@@ -105,7 +105,7 @@ baseagent/
│ │ ├── loop.py # Main agent loop
│ │ └── compaction.py # Context management
│ ├── llm/
-│ │ └── client.py # LLM client (litellm)
+│ │ └── client.py # LLM client (httpx)
│ ├── config/
│ │ └── defaults.py # Configuration
│ ├── tools/ # Tool implementations
16 changes: 8 additions & 8 deletions docs/architecture.md
@@ -18,7 +18,7 @@ graph TB
end

subgraph LLM["LLM Layer"]
client["client.py<br/>LiteLLM Client"]
client["client.py<br/>httpx Client"]
end

subgraph Config["Configuration"]
@@ -71,7 +71,7 @@ classDiagram
+log(msg)
}

-class LiteLLMClient {
+class LLMClient {
+model: str
+temperature: float
+max_tokens: int
@@ -105,8 +105,8 @@ classDiagram
+inject_content: Optional
}

-AgentContext --> LiteLLMClient : uses
-LiteLLMClient --> LLMResponse : returns
+AgentContext --> LLMClient : uses
+LLMClient --> LLMResponse : returns
LLMResponse --> FunctionCall : contains
AgentContext --> ToolRegistry : uses
ToolRegistry --> ToolResult : returns
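
Read as Python, the class diagram above maps onto simple value types. A sketch under that assumption; only `model`, `temperature`, and `max_tokens` are named in the diagram, and the remaining fields are illustrative guesses:

```python
# Dataclass sketch of the types in the class diagram. Field names beyond
# model/temperature/max_tokens are guesses for illustration.
from dataclasses import dataclass, field
from typing import Any, Optional


@dataclass
class FunctionCall:
    name: str
    arguments: dict[str, Any]


@dataclass
class LLMResponse:
    content: Optional[str]
    function_calls: list[FunctionCall] = field(default_factory=list)


@dataclass
class ToolResult:
    output: str
    is_error: bool = False  # assumed flag


@dataclass
class LLMClient:
    model: str
    temperature: float
    max_tokens: int

    def complete(self, messages: list[dict[str, Any]]) -> LLMResponse:
        """Issue the HTTP request and parse choices into an LLMResponse."""
        raise NotImplementedError  # transport shown in the client sketch further down
```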
@@ -171,13 +171,13 @@ sequenceDiagram
participant Loop as loop.py
participant Context as compaction.py
participant Cache as Prompt Cache
-participant LLM as LiteLLM Client
+participant LLM as httpx Client
participant Provider as API Provider
participant Tools as Tool Registry

User->>Entry: --instruction "Create hello.txt"
Entry->>Entry: Initialize AgentContext
-Entry->>Entry: Initialize LiteLLMClient
+Entry->>Entry: Initialize LLMClient
Entry->>Loop: run_agent_loop()

Loop->>Loop: Build messages [system, user, state]
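
The sequence above (entry point builds the context and client, hands off to `run_agent_loop()`, which assembles `[system, user, state]` messages) can be sketched as a skeleton. Every signature here is an assumption, since the diff only shows the message order:

```python
# Skeleton of the flow in the sequence diagram. All names and signatures are
# assumptions; the real loop.py also handles caching, compaction, and cost
# limits, which are omitted here.
def run_agent_loop(ctx, client, instruction):
    messages = [
        {"role": "system", "content": ctx.system_prompt},    # assumed attribute
        {"role": "user", "content": instruction},
        {"role": "user", "content": ctx.state_summary()},    # assumed helper
    ]
    while True:
        response = client.complete(messages)
        if not response.function_calls:
            return response.content  # no tool requested: task is done
        for call in response.function_calls:
            result = ctx.tools.execute(call.name, call.arguments)  # assumed API
            messages.append({"role": "tool", "content": result.output})
```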
@@ -261,8 +261,8 @@ Intelligent context management that:

### `src/llm/client.py` - LLM Client

-LiteLLM-based client that:
-- Supports multiple providers (Chutes, OpenRouter, etc.)
+httpx-based client that:
+- Uses Chutes API (OpenAI-compatible)
- Tracks token usage and costs
- Handles tool/function calling format
- Enforces cost limits
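
The usage and cost bullets suggest the client keeps a running total from each response's `usage` field and aborts past a budget. A sketch, with a placeholder flat price and a hypothetical `CostLimitExceeded` exception (neither is from the repo):

```python
# Sketch of per-request usage tracking and a cost ceiling, as the bullets
# describe. The flat per-1k-token price and class names are placeholders.
import httpx


class CostLimitExceeded(RuntimeError):
    """Raised once cumulative spend passes the configured budget (assumed)."""


class LLMClient:
    def __init__(self, base_url: str, api_key: str,
                 max_cost_usd: float, usd_per_1k_tokens: float):
        self.base_url = base_url
        self.api_key = api_key
        self.max_cost_usd = max_cost_usd
        self.usd_per_1k_tokens = usd_per_1k_tokens  # placeholder flat rate
        self.total_tokens = 0
        self.total_cost_usd = 0.0

    def complete(self, payload: dict) -> dict:
        resp = httpx.post(
            f"{self.base_url}/chat/completions",
            headers={"Authorization": f"Bearer {self.api_key}"},
            json=payload,
            timeout=60.0,
        )
        resp.raise_for_status()
        data = resp.json()
        # Accumulate usage reported by the OpenAI-compatible response body.
        tokens = data.get("usage", {}).get("total_tokens", 0)
        self.total_tokens += tokens
        self.total_cost_usd += tokens / 1000 * self.usd_per_1k_tokens
        if self.total_cost_usd > self.max_cost_usd:
            raise CostLimitExceeded(f"spent ${self.total_cost_usd:.4f}")
        return data
```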