This commit is contained in:
ViperEkura 2026-04-25 14:53:48 +08:00
parent 20e73c05e0
commit cf545ffc04
12 changed files with 1221 additions and 692 deletions

View File

@ -18,7 +18,7 @@
```json ```json
{ {
"success": true, "success": true,
"message": "注册成功", "message": "Registration successful",
"data": { "data": {
"id": 1, "id": 1,
"username": "string" "username": "string"
@ -41,19 +41,31 @@
```json ```json
{ {
"success": true, "success": true,
"message": "登录成功", "message": "Login successful",
"data": { "data": {
"access_token": "eyJ...", "access_token": "eyJ...",
"token_type": "bearer", "token_type": "bearer",
"user": { "user": {
"id": 1, "id": 1,
"username": "string", "username": "string",
"role": "user" "email": "user@example.com",
"role": "user",
"permission_level": 1,
"workspace_path": null,
"is_active": true
} }
} }
} }
``` ```
**用户权限级别:**
| 级别 | 名称 | 说明 |
|------|------|------|
| 1 | READ_ONLY | 只读权限 |
| 2 | WRITE | 写入权限 |
| 3 | EXECUTE | 执行权限 |
| 4 | ADMIN | 管理员权限 |
### POST /api/auth/logout ### POST /api/auth/logout
用户登出 用户登出
@ -63,7 +75,7 @@
```json ```json
{ {
"success": true, "success": true,
"message": "登出成功" "message": "Logout successful"
} }
``` ```
@ -81,11 +93,39 @@
"username": "string", "username": "string",
"email": "user@example.com", "email": "user@example.com",
"role": "user", "role": "user",
"is_active": true "permission_level": 1,
"workspace_path": null,
"is_active": true,
"created_at": "2024-01-01T00:00:00"
} }
} }
``` ```
### GET /api/auth/users
获取所有用户(管理员专用)
**请求头:** `Authorization: Bearer <token>`
**响应:**
```json
{
"success": true,
"data": {
"users": [...]
}
}
```
### PUT /api/auth/users/{user_id}
更新用户权限(管理员专用)
**请求体:**
```json
{
"permission_level": 2
}
```
--- ---
## 会话 `/api/conversations` ## 会话 `/api/conversations`
@ -123,10 +163,11 @@
{ {
"project_id": "string (可选)", "project_id": "string (可选)",
"title": "新会话", "title": "新会话",
"model": "glm-5", "model": "deepseek-chat",
"system_prompt": "string (可选)", "provider_id": 1,
"temperature": 1.0, "system_prompt": "You are a helpful assistant. (可选)",
"max_tokens": 65536, "temperature": 0.7,
"max_tokens": 2000,
"thinking_enabled": false "thinking_enabled": false
} }
``` ```
@ -139,9 +180,15 @@
"data": { "data": {
"id": "conv_xxx", "id": "conv_xxx",
"user_id": 1, "user_id": 1,
"provider_id": 1,
"title": "新会话", "title": "新会话",
"model": "glm-5", "model": "deepseek-chat",
... "system_prompt": "You are a helpful assistant.",
"temperature": 0.7,
"max_tokens": 2000,
"thinking_enabled": false,
"created_at": "2024-01-01T00:00:00",
"updated_at": "2024-01-01T00:00:00"
} }
} }
``` ```
@ -149,32 +196,92 @@
### GET /api/conversations/{id} ### GET /api/conversations/{id}
获取会话详情 获取会话详情
**路径参数:** **路径参数:** `id`: 会话ID
- `id`: 会话ID
**请求头:** `Authorization: Bearer <token>` **请求头:** `Authorization: Bearer <token>`
### PUT /api/conversations/{id} ### PUT /api/conversations/{id}
更新会话 更新会话
**路径参数:** `id`: 会话ID
**请求头:** `Authorization: Bearer <token>`
**请求体:**
```json
{
"title": "新标题",
"model": "gpt-4",
"provider_id": 1,
"system_prompt": "You are...",
"temperature": 0.8,
"max_tokens": 4000,
"thinking_enabled": true
}
```
### DELETE /api/conversations/{id} ### DELETE /api/conversations/{id}
删除会话 删除会话
**路径参数:** `id`: 会话ID
**请求头:** `Authorization: Bearer <token>`
--- ---
## 消息 `/api/messages` ## 消息 `/api/messages`
### GET /api/messages/{conversation_id} ### GET /api/messages/
获取消息列表 获取消息列表
**路径参数:**
- `conversation_id`: 会话ID
**查询参数:** **查询参数:**
- `conversation_id`: 会话ID必需
- `limit` (可选): 返回数量默认100 - `limit` (可选): 返回数量默认100
**请求头:** `Authorization: Bearer <token>` **请求头:** `Authorization: Bearer <token>`
**响应:**
```json
{
"success": true,
"data": {
"messages": [
{
"id": "msg_xxx",
"conversation_id": "conv_xxx",
"role": "user",
"content": "用户消息",
"text": "用户消息",
"attachments": [],
"process_steps": [],
"token_count": 10,
"usage": null,
"created_at": "2024-01-01T00:00:00"
},
{
"id": "msg_yyy",
"conversation_id": "conv_xxx",
"role": "assistant",
"content": "AI 回复文本内容",
"text": "AI 回复文本内容",
"attachments": [],
"process_steps": [
{"id": "step-0", "index": 0, "type": "thinking", "content": "让我思考..."},
{"id": "step-1", "index": 1, "type": "text", "content": "根据搜索结果..."},
{"id": "step-2", "index": 2, "type": "tool_call", "id_ref": "call_xxx", "name": "web_search", "arguments": "..."},
{"id": "step-3", "index": 3, "type": "tool_result", "id_ref": "call_xxx", "name": "web_search", "content": "...", "success": true}
],
"token_count": 100,
"usage": {"prompt_tokens": 50, "completion_tokens": 50, "total_tokens": 100},
"created_at": "2024-01-01T00:00:01"
}
],
"title": "会话标题",
"first_message": "用户的第一条消息..."
}
}
```
### POST /api/messages/ ### POST /api/messages/
发送消息(非流式) 发送消息(非流式)
@ -185,7 +292,7 @@
{ {
"conversation_id": "conv_xxx", "conversation_id": "conv_xxx",
"content": "用户消息", "content": "用户消息",
"tools_enabled": true "thinking_enabled": false
} }
``` ```
@ -201,20 +308,182 @@
``` ```
### POST /api/messages/stream ### POST /api/messages/stream
发送消息(流式响应) 发送消息(流式响应 - SSE
使用 Server-Sent Events (SSE) 返回流式响应。 使用 Server-Sent Events (SSE) 返回流式响应。
**事件类型:** **请求头:** `Authorization: Bearer <token>`
- `text`: 文本增量
- `tool_call`: 工具调用
- `tool_result`: 工具结果
- `done`: 完成
- `error`: 错误
### DELETE /api/messages/{id} **请求体:**
```json
{
"conversation_id": "conv_xxx",
"content": "用户消息",
"thinking_enabled": true,
"enabled_tools": ["web_search", "file_read", "python_execute"]
}
```
**SSE 事件类型:**
#### process_step
结构化步骤事件(渲染顺序的唯一数据源)
```json
event: process_step
data: {"step": {"id": "step-0", "index": 0, "type": "thinking", "content": "让我思考一下..."}}
event: process_step
data: {"step": {"id": "step-1", "index": 1, "type": "text", "content": "以下是搜索结果:"}}
event: process_step
data: {"step": {"id": "step-2", "index": 2, "type": "tool_call", "id_ref": "call_abc", "name": "web_search", "arguments": "{\"query\": \"...\"}"}}
event: process_step
data: {"step": {"id": "step-3", "index": 3, "type": "tool_result", "id_ref": "call_abc", "name": "web_search", "content": "{...}", "success": true}}
```
**步骤类型说明:**
| type | 说明 | 额外字段 |
|------|------|---------|
| `thinking` | 模型思考过程 | `content` |
| `text` | 文本回复 | `content` |
| `tool_call` | 工具调用 | `id_ref`, `name`, `arguments` |
| `tool_result` | 工具执行结果 | `id_ref`, `name`, `content`, `success` |
#### done
响应完成
```json
event: done
data: {"message_id": "msg_xxx", "token_count": 150, "usage": {"prompt_tokens": 100, "completion_tokens": 50, "total_tokens": 150}}
```
#### error
错误信息
```json
event: error
data: {"content": "错误信息描述"}
```
### DELETE /api/messages/{message_id}
删除消息 删除消息
**路径参数:** `message_id`: 消息ID
**请求头:** `Authorization: Bearer <token>`
---
## LLM 提供商 `/api/providers`
### GET /api/providers/
获取用户的 LLM 提供商列表
**请求头:** `Authorization: Bearer <token>`
**响应:**
```json
{
"success": true,
"data": {
"providers": [
{
"id": 1,
"user_id": 1,
"name": "DeepSeek",
"provider_type": "openai",
"base_url": "https://api.deepseek.com/v1",
"default_model": "deepseek-chat",
"max_tokens": 8192,
"is_default": true,
"enabled": true,
"created_at": "2024-01-01T00:00:00",
"updated_at": "2024-01-01T00:00:00"
}
],
"total": 1
}
}
```
### POST /api/providers/
创建 LLM 提供商
**请求头:** `Authorization: Bearer <token>`
**请求体:**
```json
{
"name": "DeepSeek",
"provider_type": "openai",
"base_url": "https://api.deepseek.com/v1",
"api_key": "sk-xxxx",
"default_model": "deepseek-chat",
"is_default": true
}
```
**provider_type 可选值:**
- `openai` - OpenAI/DeepSeek/GLM 兼容 API
- `anthropic` - Anthropic Claude API
### GET /api/providers/{provider_id}
获取提供商详情
**路径参数:** `provider_id`: 提供商ID
**请求头:** `Authorization: Bearer <token>`
### PUT /api/providers/{provider_id}
更新提供商
**路径参数:** `provider_id`: 提供商ID
**请求头:** `Authorization: Bearer <token>`
**请求体:**
```json
{
"name": "新名称",
"base_url": "https://api.example.com/v1",
"api_key": "sk-yyyy",
"default_model": "gpt-4",
"max_tokens": 16384,
"is_default": false,
"enabled": true
}
```
### DELETE /api/providers/{provider_id}
删除提供商
**路径参数:** `provider_id`: 提供商ID
**请求头:** `Authorization: Bearer <token>`
### POST /api/providers/{provider_id}/test
测试提供商连接
**路径参数:** `provider_id`: 提供商ID
**请求头:** `Authorization: Bearer <token>`
**响应:**
```json
{
"success": true,
"message": "HTTP 200: ...",
"data": {
"status_code": 200,
"success": true,
"response_body": "..."
}
}
```
--- ---
## 工具 `/api/tools` ## 工具 `/api/tools`
@ -223,7 +492,7 @@
获取可用工具列表 获取可用工具列表
**查询参数:** **查询参数:**
- `category` (可选): 工具分类 - `category` (可选): 工具分类code/file/shell/crawler/data
**请求头:** `Authorization: Bearer <token>` **请求头:** `Authorization: Bearer <token>`
@ -232,12 +501,21 @@
{ {
"success": true, "success": true,
"data": { "data": {
"tools": [...], "tools": [
{
"name": "python_execute",
"description": "Execute Python code",
"category": "code",
"parameters": {...}
},
...
],
"categorized": { "categorized": {
"crawler": [...],
"code": [...], "code": [...],
"data": [...], "file": [...],
"weather": [...] "shell": [...],
"crawler": [...],
"data": [...]
}, },
"total": 11 "total": 11
} }
@ -247,9 +525,39 @@
### GET /api/tools/{name} ### GET /api/tools/{name}
获取工具详情 获取工具详情
**路径参数:** `name`: 工具名称
**请求头:** `Authorization: Bearer <token>`
**响应:**
```json
{
"success": true,
"data": {
"name": "web_search",
"description": "Search the web using DuckDuckGo",
"category": "crawler",
"parameters": {
"type": "object",
"properties": {
"query": {
"type": "string",
"description": "Search query"
}
},
"required": ["query"]
}
}
}
```
### POST /api/tools/{name}/execute ### POST /api/tools/{name}/execute
手动执行工具 手动执行工具
**路径参数:** `name`: 工具名称
**请求头:** `Authorization: Bearer <token>`
**请求体:** **请求体:**
```json ```json
{ {
@ -257,3 +565,89 @@
"arg2": "value2" "arg2": "value2"
} }
``` ```
**响应:**
```json
{
"success": true,
"data": {
"result": "..."
}
}
```
---
## 公共端点
### GET /api/health
健康检查
**响应:**
```json
{
"status": "ok",
"message": "Luxx API is running"
}
```
### GET /api/
服务信息
**响应:**
```json
{
"name": "Luxx",
"version": "1.0.0",
"description": "AI Chat API"
}
```
---
## 工具说明
### 内置工具
#### 代码执行 (code)
| 工具 | 功能 | 权限 |
|------|------|------|
| `python_execute` | 执行 Python 代码 | EXECUTE |
| `python_eval` | 计算表达式 | EXECUTE |
#### 文件操作 (file)
| 工具 | 功能 | 权限 |
|------|------|------|
| `file_read` | 读取文件内容 | READ_ONLY |
| `file_write` | 写入文件内容 | WRITE |
| `file_list` | 列出目录内容 | READ_ONLY |
| `file_exists` | 检查文件是否存在 | READ_ONLY |
| `file_grep` | 正则搜索文件 | READ_ONLY |
#### Shell 命令 (shell)
| 工具 | 功能 | 权限 |
|------|------|------|
| `shell_execute` | 执行 Shell 命令 | EXECUTE |
#### 网页爬虫 (crawler)
| 工具 | 功能 | 权限 |
|------|------|------|
| `web_search` | DuckDuckGo 搜索 | READ_ONLY |
| `web_fetch` | 网页抓取 | READ_ONLY |
| `batch_fetch` | 批量并发抓取 | READ_ONLY |
#### 数据处理 (data)
| 工具 | 功能 | 权限 |
|------|------|------|
| `process_data` | JSON 转换、格式化 | READ_ONLY |
### 权限检查
工具执行时自动检查用户权限:
```
工具要求的权限 <= 用户拥有的权限 → 允许执行
工具要求的权限 > 用户拥有的权限 → 返回错误
```
用户通过 `/api/auth/users/{user_id}` 接口设置权限级别。

View File

@ -17,39 +17,50 @@
``` ```
luxx/ luxx/
├── __init__.py # FastAPI 应用工厂 ├── __init__.py # FastAPI 应用工厂
├── config.py # 配置管理YAML ├── config.py # 配置管理YAML
├── database.py # 数据库连接 ├── database.py # 数据库连接
├── models.py # ORM 模型 ├── models.py # ORM 模型
├── routes/ # API 路由层 ├── routes/ # API 路由层
│ ├── __init__.py # 路由聚合 │ ├── __init__.py # 路由聚合
│ ├── auth.py # 认证 (登录/注册) │ ├── auth.py # 认证 (登录/注册)
│ ├── conversations.py # 会话管理 (CRUD) │ ├── conversations.py # 会话管理 (CRUD)
│ ├── messages.py # 消息处理 (流式/同步) │ ├── messages.py # 消息处理 (流式/同步)
│ ├── providers.py # LLM 提供商管理 │ ├── providers.py # LLM 提供商管理
│ └── tools.py # 工具管理 │ └── tools.py # 工具管理
├── services/ # 服务层 ├── services/ # 服务层
│ ├── chat.py # 聊天服务门面 │ ├── __init__.py # 服务导出
│ ├── agentic_loop.py # Agentic Loop 执行器 │ ├── chat.py # 聊天服务门面
│ ├── stream_context.py# 流式状态管理 │ ├── agentic_loop.py # Agentic Loop 执行器
│ ├── llm_response.py # LLM 响应解析器 │ ├── stream_context.py # 流式状态管理
│ ├── process_result.py# 处理结果 │ ├── llm_response.py # LLM 响应数据类
│ └── llm_client.py # LLM 客户端 │ ├── process_result.py # [已移除]
├── tools/ # 工具系统 │ ├── task.py # 任务系统 (Task/TaskGraph/TaskService)
│ ├── core.py # 核心类 (ToolRegistry, ToolDefinition, ToolResult) │ ├── llm_client.py # LLM 客户端
│ ├── factory.py # @tool 装饰器 │ └── llm_adapters/ # LLM API 适配器
│ ├── executor.py # 工具执行器 (缓存/并行) │ ├── __init__.py # 适配器导出
│ ├── services.py # 工具服务层 │ ├── base.py # ProviderAdapter 基类
│ └── builtin/ # 内置工具 │ ├── openai_adapter.py # OpenAI/DeepSeek/GLM 适配器
│ ├── __init__.py # 工具注册入口 │ └── anthropic_adapter.py # Anthropic Claude 适配器
│ ├── code.py # 代码执行 (python_execute, python_eval) ├── tools/ # 工具系统
│ ├── crawler.py # 网页爬虫 (web_search, web_fetch, batch_fetch) │ ├── __init__.py # 工具注册入口
│ └── data.py # 数据处理 (process_data) │ ├── core.py # 核心类 (ToolRegistry, ToolDefinition, ToolResult, ToolContext)
└── utils/ # 工具函数 │ ├── factory.py # @tool 装饰器
└── helpers.py # 密码哈希、ID生成、响应封装 │ ├── executor.py # 工具执行器 (缓存/并行)
│ ├── services.py # 工具服务层
│ └── builtin/ # 内置工具
│ ├── __init__.py # 工具注册入口
│ ├── code.py # 代码执行 (python_execute, python_eval)
│ ├── crawler.py # 网页爬虫 (web_search, web_fetch, batch_fetch)
│ ├── data.py # 数据处理 (process_data)
│ ├── file.py # 文件操作 (file_read, file_write, file_list, file_exists, file_grep)
│ └── shell.py # Shell 命令 (shell_execute)
└── utils/ # 工具函数
├── __init__.py
└── helpers.py # 密码哈希、ID生成、响应封装
run.py # 应用入口文件 run.py # 应用入口文件
config.yaml # 配置文件 config.yaml # 配置文件
``` ```
## 核心组件 ## 核心组件
@ -77,15 +88,36 @@ password: admin123
app: app:
secret_key: ${APP_SECRET_KEY} secret_key: ${APP_SECRET_KEY}
debug: true debug: true
host: 0.0.0.0
port: 8000
database: database:
type: sqlite type: sqlite
url: sqlite:///./chat.db url: sqlite:///./chat.db
workspace:
root: ./workspaces # 用户工作空间根目录
auto_create: true # 自动创建用户目录
llm: llm:
provider: deepseek provider: deepseek
api_key: ${DEEPSEEK_API_KEY} api_key: ${DEEPSEEK_API_KEY}
api_url: https://api.deepseek.com/v1 api_url: https://api.deepseek.com/v1
tools:
enable_cache: true
cache_ttl: 300
max_workers: 4
max_iterations: 10
logging:
level: INFO
```
**工作空间隔离机制:**
- 每个用户的工作空间路径基于 `user_id` 的 SHA256 哈希值
- 格式:`{workspace_root}/{hash_of_user_id}`
- 所有文件操作必须在用户工作空间内,防止路径穿越攻击
``` ```
### 3. 数据库 (`database.py`) ### 3. 数据库 (`database.py`)
@ -103,6 +135,8 @@ erDiagram
string email UK string email UK
string password_hash string password_hash
string role string role
int permission_level "1=READ_ONLY, 2=WRITE, 3=EXECUTE, 4=ADMIN"
string workspace_path "用户工作空间路径"
boolean is_active boolean is_active
datetime created_at datetime created_at
} }
@ -164,6 +198,14 @@ erDiagram
CONVERSATION ||--o{ MESSAGE : "has" CONVERSATION ||--o{ MESSAGE : "has"
``` ```
**用户权限级别 (permission_level)**
| 级别 | 名称 | 说明 |
|------|------|------|
| 1 | READ_ONLY | 只读权限 |
| 2 | WRITE | 写入权限(文件写入) |
| 3 | EXECUTE | 执行权限代码执行、Shell命令 |
| 4 | ADMIN | 管理员权限 |
### Message Content JSON 结构 ### Message Content JSON 结构
`content` 字段统一使用 JSON 格式存储: `content` 字段统一使用 JSON 格式存储:
@ -183,8 +225,6 @@ erDiagram
```json ```json
{ {
"text": "AI 回复的文本内容",
"tool_calls": [...],
"steps": [ "steps": [
{"id": "step-0", "index": 0, "type": "thinking", "content": "..."}, {"id": "step-0", "index": 0, "type": "thinking", "content": "..."},
{"id": "step-1", "index": 1, "type": "text", "content": "..."}, {"id": "step-1", "index": 1, "type": "text", "content": "..."},
@ -194,7 +234,9 @@ erDiagram
} }
``` ```
`steps` 字段是**渲染顺序的唯一数据源**,按 `index` 顺序排列。thinking、text、tool_call、tool_result 可以在多轮迭代中穿插出现。 `steps` 字段是**唯一数据源**,按 `index` 顺序排列。thinking、text、tool_call、tool_result 可以在多轮迭代中穿插出现。
**注意**`text` 和 `content` 字段通过解析 `steps` 中所有 `type: "text"` 的内容动态计算得出。
### 5. 工具系统 ### 5. 工具系统
@ -206,9 +248,25 @@ classDiagram
+dict parameters +dict parameters
+Callable handler +Callable handler
+str category +str category
+CommandPermission required_permission
+to_openai_format() dict +to_openai_format() dict
} }
class ToolContext {
+int user_id
+str username
+str workspace
+int user_permission_level
}
class CommandPermission {
<<enumeration>>
READ_ONLY = 1
WRITE = 2
EXECUTE = 3
ADMIN = 4
}
class ToolResult { class ToolResult {
+bool success +bool success
+Any data +Any data
@ -224,7 +282,7 @@ classDiagram
+get(name) ToolDefinition? +get(name) ToolDefinition?
+list_all() List~dict~ +list_all() List~dict~
+list_by_category(category) List~dict~ +list_by_category(category) List~dict~
+execute(name, arguments) dict +execute(name, arguments, context) dict
+remove(name) bool +remove(name) bool
} }
@ -243,14 +301,51 @@ classDiagram
#### 内置工具 #### 内置工具
| 工具 | 功能 | 说明 | **代码执行 (code.py)**
| 工具 | 功能 | 权限 |
|------|------|------| |------|------|------|
| `python_execute` | 执行 Python 代码 | 支持 print 输出、变量访问 | | `python_execute` | 执行 Python 代码 | EXECUTE |
| `python_eval` | 计算表达式 | 快速求值 | | `python_eval` | 计算表达式 | EXECUTE |
| `web_search` | DuckDuckGo HTML | DuckDuckGo HTML 搜索 |
| `web_fetch` | 网页抓取 | httpx + BeautifulSoup支持 text/links/structured | **文件操作 (file.py)**
| `batch_fetch` | 批量抓取 | 并发获取多个页面 |
| `process_data` | 数据处理 | JSON 转换、格式化等 | | 工具 | 功能 | 权限 |
|------|------|------|
| `file_read` | 读取文件内容 | READ_ONLY |
| `file_write` | 写入文件内容 | WRITE |
| `file_list` | 列出目录内容 | READ_ONLY |
| `file_exists` | 检查文件是否存在 | READ_ONLY |
| `file_grep` | 正则搜索文件内容 | READ_ONLY |
**Shell 命令 (shell.py)**
| 工具 | 功能 | 权限 |
|------|------|------|
| `shell_execute` | 执行 Shell 命令 | EXECUTE |
**网页爬虫 (crawler.py)**
| 工具 | 功能 | 权限 |
|------|------|------|
| `web_search` | DuckDuckGo HTML 搜索 | READ_ONLY |
| `web_fetch` | 网页抓取 | READ_ONLY |
| `batch_fetch` | 批量并发抓取 | READ_ONLY |
**数据处理 (data.py)**
| 工具 | 功能 | 权限 |
|------|------|------|
| `process_data` | JSON 转换、格式化 | READ_ONLY |
#### 权限检查机制
工具执行时自动检查用户权限:
```
工具要求的权限 <= 用户拥有的权限 → 允许执行
工具要求的权限 > 用户拥有的权限 → 拒绝执行
```
#### 工具开发规范 #### 工具开发规范
@ -312,26 +407,82 @@ ToolExecutor 返回结果
### 6. 服务层 ### 6. 服务层
#### LLMResponseParser (`services/llm_response.py`) #### LLM 适配器 (`services/llm_adapters/`)
统一解析器,兼容多种 LLM API 格式:
- **OpenAI**: `delta.content`, `delta.tool_calls` 适配器模式统一处理不同 LLM API 格式:
- **DeepSeek**: `delta.content`, `delta.reasoning_content`
- **Anthropic**: `content_block` 类型事件 ```mermaid
- **MiniMax**: `<|im_start|>thinking...<|im_end|>` 标签 classDiagram
class ProviderAdapter {
<<abstract>>
+str provider_type
+build_request() tuple
+parse_stream_chunk() AsyncGenerator
+parse_response() Dict
+supports_thinking() bool
+supports_tools() bool
}
class OpenAIAdapter {
+str provider_type = "openai"
+build_request() tuple
+parse_stream_chunk() AsyncGenerator
+parse_response() Dict
+supports_tools() bool
}
class AnthropicAdapter {
+str provider_type = "anthropic"
+build_request() tuple
+parse_stream_chunk() AsyncGenerator
+parse_response() Dict
+supports_thinking() bool
+supports_tools() bool
}
ProviderAdapter <|-- OpenAIAdapter
ProviderAdapter <|-- AnthropicAdapter
```
**支持的功能对比:**
| 适配器 | 工具调用 | Thinking/Reasoning | 流式响应 |
|--------|----------|-------------------|----------|
| OpenAI | ✅ | ✅ (DeepSeek) | ✅ |
| Anthropic | ✅ | ✅ | ✅ |
#### LLM 响应数据类 (`services/llm_response.py`)
```python ```python
from luxx.services.llm_response import llm_parser class StepType:
"""步骤类型常量"""
THINKING = "thinking"
TEXT = "text"
TOOL_CALL = "tool_call"
TOOL_RESULT = "tool_result"
# 解析 OpenAI 格式
parsed = llm_parser.parse_openai(delta)
# 解析 Anthropic 格式 @dataclass
parsed = llm_parser.parse_anthropic(chunk) class Step:
"""单个步骤 - 用于存储和传输"""
id: str
index: int
type: str # thinking, text, tool_call, tool_result
content: str = ""
name: str = "" # tool_call/tool_result
arguments: str = "" # tool_call
id_ref: str = "" # tool_result
success: bool = True
# 返回 ParsedDelta
parsed.thinking # 思考内容 @dataclass
parsed.text # 文本内容 class ParsedDelta:
parsed.tool_calls # 工具调用 """LLM 流式响应增量"""
thinking: str = "" # 思考内容(增量)
text: str = "" # 文本内容(增量)
tool_call: Optional[Dict] = None # 单个工具调用
usage: Dict[str, int] = {} # Token 用量
is_complete: bool = False
``` ```
#### ChatService (`services/chat.py`) #### ChatService (`services/chat.py`)
@ -340,30 +491,101 @@ parsed.tool_calls # 工具调用
- 流式 SSE 响应 - 流式 SSE 响应
- 工具调用编排(并行执行) - 工具调用编排(并行执行)
- 消息历史管理 - 消息历史管理
- 自动重试机制
- Token 用量追踪 - Token 用量追踪
- 工作空间上下文传递
#### AgenticLoop (`services/agentic_loop.py`) #### AgenticLoop (`services/agentic_loop.py`)
执行 Agentic Loop 的核心循环: 执行 Agentic Loop 的核心循环:
- 调用 LLM 获取响应 - 调用 LLM 获取响应(流式)
- 使用 LLMResponseParser 解析响应 - 解析 ParsedDelta更新步骤状态
- 管理 thinking/text/tool_call/tool_result 步骤 - 管理 thinking/text/tool_call/tool_result 步骤
- 工具并行执行 - 工具并行执行
- 最大迭代次数10
```python
# 执行流程
async for delta in llm.stream_call(...):
events = self._process_delta(delta, context, total_usage)
yield from events
# 工具调用时
tool_results = self.tool_executor.process_tool_calls_parallel(...)
messages.append({"role": "assistant", ...})
messages.extend(tool_results)
```
#### StreamContext (`services/stream_context.py`) #### StreamContext (`services/stream_context.py`)
流式状态管理: 流式状态管理:
- 追踪当前步骤类型和索引 - 追踪当前步骤类型和索引
- 累积 thinking 和 text 内容 - 累积 thinking 和 text 内容
- 管理 tool_calls 列表 - 管理 tool_calls 列表和 tool_results
- 生成 SSE 事件 - 生成 SSE 事件
- 构建完整消息内容
#### LLMClient (`services/llm_client.py`) #### LLMClient (`services/llm_client.py`)
LLM API 客户端: LLM API 客户端:
- 多提供商DeepSeek、GLM、OpenAI - 多提供商OpenAI、DeepSeek、Anthropic
- 自动适配器选择
- 流式/同步调用 - 流式/同步调用
- 错误处理和重试 - 错误处理和重试
- Token 计数 - Token 计数
### 7. 任务系统 (`services/task.py`)
用于自主任务执行和依赖管理:
```mermaid
classDiagram
class Task {
+str id
+str name
+str goal
+TaskStatus status
+List~Step~ steps
+List~Task~ subtasks
}
class Step {
+str id
+str name
+List~str~ depends_on
+StepStatus status
}
class TaskGraph {
+topological_sort() List~Step~
+get_ready_steps() List~Step~
+detect_cycles() List~List~str~~
+validate() tuple
}
class TaskService {
+create_task() Task
+get_task() Task
+update_task_status() Task
+add_steps() List~Step~
+build_graph() TaskGraph
}
Task "1" o-- "*" Step
Task "1" o-- "*" Task
TaskService ..> TaskGraph
```
**任务状态 (TaskStatus)**
- `PENDING` - 待处理
- `READY` - 就绪
- `RUNNING` - 运行中
- `BLOCK` - 阻塞
- `TERMINATED` - 已终止
**步骤状态 (StepStatus)**
- `PENDING` - 待执行
- `RUNNING` - 执行中
- `COMPLETED` - 已完成
- `FAILED` - 失败
- `SKIPPED` - 跳过
### 7. 认证系统 (`routes/auth.py`) ### 7. 认证系统 (`routes/auth.py`)
- JWT Bearer Token - JWT Bearer Token
- Bcrypt 密码哈希 - Bcrypt 密码哈希
@ -481,6 +703,10 @@ database:
type: sqlite type: sqlite
url: sqlite:///./chat.db url: sqlite:///./chat.db
workspace:
root: ./workspaces # 用户工作空间根目录
auto_create: true # 自动创建用户工作空间
llm: llm:
provider: deepseek provider: deepseek
api_key: ${DEEPSEEK_API_KEY} api_key: ${DEEPSEEK_API_KEY}
@ -491,6 +717,9 @@ tools:
cache_ttl: 300 cache_ttl: 300
max_workers: 4 max_workers: 4
max_iterations: 10 max_iterations: 10
logging:
level: INFO
``` ```
## 环境变量 ## 环境变量
@ -501,6 +730,26 @@ tools:
| `DEEPSEEK_API_KEY` | DeepSeek API | `sk-xxxx` | | `DEEPSEEK_API_KEY` | DeepSeek API | `sk-xxxx` |
| `DATABASE_URL` | 数据库连接 | `sqlite:///./chat.db` | | `DATABASE_URL` | 数据库连接 | `sqlite:///./chat.db` |
## LLM 适配器配置
### OpenAI 兼容 (DeepSeek/GLM 等)
```yaml
llm:
provider: openai
api_key: ${API_KEY}
api_url: https://api.deepseek.com/v1 # 或其他兼容端点
```
### Anthropic Claude
```yaml
llm:
provider: anthropic
api_key: ${ANTHROPIC_API_KEY}
api_url: https://api.anthropic.com/v1
```
## 项目结构说明 ## 项目结构说明
### 入口文件 ### 入口文件
@ -530,5 +779,21 @@ ToolExecutor 支持结果缓存:
1. 实时返回 thinking_content模型思考过程 1. 实时返回 thinking_content模型思考过程
2. 实时返回 text 增量更新 2. 实时返回 text 增量更新
3. 工具调用行执行,结果批量返回 3. 工具调用行执行,结果批量返回
4. 最终 `done` 事件包含完整 message_id 和 token 用量 4. 最终 `done` 事件包含完整 message_id 和 token 用量
### 工作空间隔离
每个用户的工作空间完全隔离:
- 用户目录基于 user_id 的 SHA256 哈希生成
- 所有文件操作强制在用户工作空间内
- 支持权限级别控制文件操作能力
### MessageBuilder
用于构建发送给 LLM 的消息列表:
- `add_system()` - 添加系统消息
- `add_user()` - 添加用户消息JSON 格式)
- `add_assistant()` - 添加助手消息
- `add_tool_result()` - 添加工具结果消息
- `extract_text()` - 从 JSON 内容中提取文本

View File

@ -154,8 +154,6 @@ class Message(Base):
**Assistant 消息** **Assistant 消息**
{ {
"text": "AI 回复的文本内容",
"tool_calls": [...], // 遗留的扁平结构
"steps": [ // 有序步骤用于渲染主要数据源 "steps": [ // 有序步骤用于渲染主要数据源
{"id": "step-0", "index": 0, "type": "thinking", "content": "..."}, {"id": "step-0", "index": 0, "type": "thinking", "content": "..."},
{"id": "step-1", "index": 1, "type": "text", "content": "..."}, {"id": "step-1", "index": 1, "type": "text", "content": "..."},
@ -163,6 +161,8 @@ class Message(Base):
{"id": "step-3", "index": 3, "type": "tool_result", "id_ref": "call_xxx", "name": "...", "content": "..."} {"id": "step-3", "index": 3, "type": "tool_result", "id_ref": "call_xxx", "name": "...", "content": "..."}
] ]
} }
注意to_dict() 返回时会从 steps 动态计算 text content 字段
""" """
__tablename__ = "messages" __tablename__ = "messages"
@ -204,20 +204,22 @@ class Message(Base):
result["content"] = self.content result["content"] = self.content
result["text"] = self.content result["text"] = self.content
result["attachments"] = [] result["attachments"] = []
result["tool_calls"] = []
result["process_steps"] = [] result["process_steps"] = []
return result return result
# Extract common fields
result["text"] = content_obj.get("text", "")
result["attachments"] = content_obj.get("attachments", [])
result["tool_calls"] = content_obj.get("tool_calls", [])
# Extract steps as process_steps for frontend rendering # Extract steps as process_steps for frontend rendering
result["process_steps"] = content_obj.get("steps", []) steps = content_obj.get("steps", [])
result["process_steps"] = steps
# For backward compatibility # Extract text from steps (concatenate all text type steps)
if "content" not in result: text_content = "".join(
result["content"] = result["text"] s.get("content", "") for s in steps
if s.get("type") == "text"
)
result["text"] = text_content
result["content"] = text_content # Alias for convenience
# Extract attachments
result["attachments"] = content_obj.get("attachments", [])
return result return result

View File

@ -1,4 +1,4 @@
"""Services module""" """Services module"""
from luxx.services.llm_client import LLMClient from luxx.services.llm_client import LLMClient
from luxx.services.llm_response import ParsedDelta, LLMResponse from luxx.services.llm_response import ParsedDelta, Step, StepType
from luxx.services.chat import ChatService, create_chat_service from luxx.services.chat import ChatService, create_chat_service

View File

@ -1,13 +1,5 @@
"""AgenticLoop - Executes the Agentic Loop: LLM + Tools iteration. """AgenticLoop - Executes the Agentic Loop: LLM + Tools iteration."""
The loop:
1. Call LLM with messages and tools
2. Check for tool calls in response
3. Execute tools in parallel
4. Add results to messages
5. Repeat (max 10 iterations)
6. Return final response
"""
import uuid import uuid
import logging import logging
from typing import List, Dict, AsyncGenerator from typing import List, Dict, AsyncGenerator
@ -15,21 +7,14 @@ from typing import List, Dict, AsyncGenerator
from luxx.tools.executor import ToolExecutor from luxx.tools.executor import ToolExecutor
from luxx.services.llm_client import LLMClient from luxx.services.llm_client import LLMClient
from luxx.services.stream_context import StreamContext, _sse_event from luxx.services.stream_context import StreamContext, _sse_event
from luxx.services.process_result import ProcessResult from luxx.services.llm_response import ParsedDelta, StepType
from luxx.services.llm_response import ParsedDelta
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
# Maximum iterations to prevent infinite loops
MAX_ITERATIONS = 10 MAX_ITERATIONS = 10
class AgenticLoop: class AgenticLoop:
"""Executes the Agentic Loop: LLM + Tools iteration.
Supports multiple LLM Providers, auto-adapts response format.
"""
def __init__(self, tool_executor: ToolExecutor): def __init__(self, tool_executor: ToolExecutor):
self.tool_executor = tool_executor self.tool_executor = tool_executor
@ -45,17 +30,12 @@ class AgenticLoop:
context: 'StreamContext', context: 'StreamContext',
tool_context: dict = None tool_context: dict = None
) -> AsyncGenerator[str, None]: ) -> AsyncGenerator[str, None]:
"""Execute the agentic loop.
Yields SSE events for each step.
"""
total_usage = {"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0} total_usage = {"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0}
for iteration in range(MAX_ITERATIONS): for iteration in range(MAX_ITERATIONS):
context.reset() context.reset()
has_error = False has_error = False
# Stream LLM response - now yields ParsedDelta directly
async for delta in llm.stream_call( async for delta in llm.stream_call(
model=model, model=model,
messages=messages, messages=messages,
@ -64,38 +44,33 @@ class AgenticLoop:
max_tokens=max_tokens, max_tokens=max_tokens,
thinking_enabled=thinking_enabled thinking_enabled=thinking_enabled
): ):
# Process parsed delta events = self._process_delta(delta, context, total_usage)
result = self._process_delta(delta, context, total_usage) for event in events:
# Yield events
for event in result.events:
yield event yield event
# Check for errors if not delta.has_content() and not delta.is_complete:
if result.has_error:
has_error = True has_error = True
break break
# If error occurred, break the loop
if has_error: if has_error:
break break
# Finalize current step # Flush remaining content on complete
if delta.is_complete:
for event in self._flush_remaining(context):
yield event
context.finalize_step() context.finalize_step()
# Check for tool calls
if context.tool_calls_list: if context.tool_calls_list:
# Execute tools and yield events
for event in self._execute_tools(context, messages, tool_context): for event in self._execute_tools(context, messages, tool_context):
yield event yield event
continue continue
# No tools - complete
for event in self._complete(context, total_usage): for event in self._complete(context, total_usage):
yield event yield event
return return
# Max iterations exceeded or error occurred
if not has_error: if not has_error:
yield _sse_event("error", {"content": "Exceeded maximum tool call iterations"}) yield _sse_event("error", {"content": "Exceeded maximum tool call iterations"})
@ -104,25 +79,9 @@ class AgenticLoop:
delta: ParsedDelta, delta: ParsedDelta,
ctx: 'StreamContext', ctx: 'StreamContext',
total_usage: dict total_usage: dict
) -> ProcessResult: ) -> List[str]:
"""Process ParsedDelta from adapter, return result with events and flags. events = []
Args:
delta: ParsedDelta from LLM adapter
ctx: StreamContext for state management
total_usage: Accumulated token usage
Returns:
ProcessResult with events and flags
"""
result = ProcessResult()
# Check for error (empty delta with no content)
if not delta.has_content() and not delta.is_complete:
# Empty delta, possibly an error
return result
# Update usage
if delta.usage: if delta.usage:
total_usage.update({ total_usage.update({
"prompt_tokens": delta.usage.get("prompt_tokens", 0), "prompt_tokens": delta.usage.get("prompt_tokens", 0),
@ -130,73 +89,51 @@ class AgenticLoop:
"total_tokens": delta.usage.get("total_tokens", 0) "total_tokens": delta.usage.get("total_tokens", 0)
}) })
# Process thinking content (incremental) if delta.content:
if delta.thinking: result = ctx.process_content(delta.content)
logger.debug(f"Processing thinking: {delta.thinking[:50]}...") if result["should_emit"]:
ctx.full_thinking += delta.thinking # Accumulate incremental content # Only emit if there's content
if not ctx.current_step_id or ctx.current_step_type != "thinking": if result["thinking"]:
ctx.start_step("thinking") ctx.full_thinking += result["thinking"]
result.add_event(_sse_event("process_step", { ctx.start_step(StepType.THINKING)
"step": { events.append(ctx.emit_thinking())
"id": ctx.current_step_id,
"index": ctx.current_step_idx,
"type": "thinking",
"content": ctx.full_thinking
}
}))
result.set_content()
# Process text content (incremental) if result["text"]:
if delta.text: ctx.full_content += result["text"]
ctx.full_content += delta.text # Accumulate incremental content ctx.start_step(StepType.TEXT)
if not ctx.current_step_id or ctx.current_step_type != "text": events.append(ctx.emit_text())
ctx.start_step("text")
result.add_event(_sse_event("process_step", {
"step": {
"id": ctx.current_step_id,
"index": ctx.current_step_idx,
"type": "text",
"content": ctx.full_content
}
}))
result.set_content()
# Process tool calls # Clear buffers after emit
if delta.tool_calls: ctx._thinking_buf = ""
for tc in delta.tool_calls: ctx._text_buf = ""
ctx.accumulate_tool_call(tc)
result.set_tool_calls()
return result if delta.has_tool_call():
ctx.accumulate_tool_call(delta.tool_call)
return events
def _execute_tools(self, ctx: 'StreamContext', messages: list, def _execute_tools(self, ctx: 'StreamContext', messages: list,
tool_context: dict = None) -> List[str]: tool_context: dict = None) -> List[str]:
"""Execute tools and return list of events."""
events = [] events = []
# Emit tool call steps
for event in ctx.emit_tool_calls(): for event in ctx.emit_tool_calls():
events.append(event) events.append(event)
# Execute in parallel
tool_results = self.tool_executor.process_tool_calls_parallel( tool_results = self.tool_executor.process_tool_calls_parallel(
ctx.tool_calls_list, tool_context or {} ctx.tool_calls_list, tool_context or {}
) )
# Get tool call IDs for result linking
tool_ids = [tc.get("id") for tc in ctx.tool_calls_list] tool_ids = [tc.get("id") for tc in ctx.tool_calls_list]
tool_step_ids = [ tool_step_ids = [
s["id"] for s in ctx.all_steps s.id for s in ctx.all_steps
if s["type"] == "tool_call" and s.get("id_ref") in tool_ids if s.type == StepType.TOOL_CALL and s.id_ref in tool_ids
] ]
# Emit tool result steps
for i, (tr, tc) in enumerate(zip(tool_results, ctx.tool_calls_list)): for i, (tr, tc) in enumerate(zip(tool_results, ctx.tool_calls_list)):
ref_id = tool_step_ids[i] if i < len(tool_step_ids) else f"step-{len(ctx.all_steps) - len(tool_results) + i}" ref_id = tool_step_ids[i] if i < len(tool_step_ids) else f"step-{len(ctx.all_steps) - len(tool_results) + i}"
_, event = ctx.emit_tool_result(tr, ref_id) _, event = ctx.emit_tool_result(tr, ref_id)
events.append(event) events.append(event)
# Prepare for next iteration
messages.append({ messages.append({
"role": "assistant", "role": "assistant",
"content": ctx.full_content or "", "content": ctx.full_content or "",
@ -206,8 +143,24 @@ class AgenticLoop:
return events return events
def _flush_remaining(self, ctx: 'StreamContext') -> List[str]:
"""Flush remaining buffers on complete."""
events = []
thinking, text = ctx.flush()
if thinking:
ctx.full_thinking += thinking
ctx.start_step(StepType.THINKING)
events.append(ctx.emit_thinking())
ctx.finalize_step()
if text:
ctx.full_content += text
ctx.start_step(StepType.TEXT)
events.append(ctx.emit_text())
ctx.finalize_step()
return events
def _complete(self, ctx: 'StreamContext', total_usage: dict) -> List[str]: def _complete(self, ctx: 'StreamContext', total_usage: dict) -> List[str]:
"""Complete the loop and return list of events.""" # Note: buffers already flushed in _flush_remaining or _process_delta
token_count = total_usage.get("completion_tokens") or len(ctx.full_content) // 4 token_count = total_usage.get("completion_tokens") or len(ctx.full_content) // 4
msg_id = str(uuid.uuid4()) msg_id = str(uuid.uuid4())
logger.info(f"[TOKEN] usage={total_usage}, count={token_count}") logger.info(f"[TOKEN] usage={total_usage}, count={token_count}")

View File

@ -17,7 +17,6 @@ from luxx.tools.core import registry
from luxx.services.llm_client import LLMClient from luxx.services.llm_client import LLMClient
from luxx.services.stream_context import StreamContext from luxx.services.stream_context import StreamContext
from luxx.services.agentic_loop import AgenticLoop from luxx.services.agentic_loop import AgenticLoop
from luxx.config import config
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
@ -199,15 +198,12 @@ class ChatService:
): ):
yield event yield event
# Save message after successful completion (only if we have content) # Save message after successful completion
if ctx._last_message_id and (ctx.full_content or ctx.all_tool_calls): if ctx._last_message_id and ctx.all_steps:
self._save_message( self._save_message(
conversation.id, conversation.id,
ctx._last_message_id, ctx._last_message_id,
ctx.full_content, ctx.get_steps_for_save(),
ctx.all_tool_calls,
ctx.all_tool_results,
ctx.all_steps,
ctx._last_token_count, ctx._last_token_count,
ctx._last_usage ctx._last_usage
) )
@ -223,7 +219,11 @@ class ChatService:
tools_enabled: bool = True, tools_enabled: bool = True,
thinking_enabled: bool = False thinking_enabled: bool = False
) -> Dict[str, Any]: ) -> Dict[str, Any]:
"""Non-streaming response for simple requests.""" """Non-streaming response for simple requests.
Note: For non-streaming, we return the raw LLM response.
Tool calls should be handled by the streaming endpoint.
"""
try: try:
messages = self.build_messages(conversation) messages = self.build_messages(conversation)
messages.append({ messages.append({
@ -246,9 +246,9 @@ class ChatService:
return { return {
"success": True, "success": True,
"content": response.content, "content": response.get("content", ""),
"tool_calls": response.tool_calls, "tool_calls": response.get("tool_calls", []),
"usage": response.usage "usage": response.get("usage", {})
} }
except httpx.HTTPStatusError as e: except httpx.HTTPStatusError as e:
@ -262,16 +262,13 @@ class ChatService:
logger.error(f"Non-stream error: {type(e).__name__}: {e}\n{traceback.format_exc()}") logger.error(f"Non-stream error: {type(e).__name__}: {e}\n{traceback.format_exc()}")
return {"success": False, "error": f"{type(e).__name__}: {str(e)}"} return {"success": False, "error": f"{type(e).__name__}: {str(e)}"}
def _save_message(self, conversation_id: str, msg_id: str, full_content: str, def _save_message(self, conversation_id: str, msg_id: str,
all_tool_calls: list, all_tool_results: list, all_steps: list, all_steps: list, token_count: int = 0, usage: dict = None):
token_count: int = 0, usage: dict = None):
"""Save assistant message to database.""" """Save assistant message to database."""
from luxx.database import SessionLocal from luxx.database import SessionLocal
from luxx.models import Message from luxx.models import Message
content_json = {"text": full_content, "steps": all_steps} content_json = {"steps": all_steps}
if all_tool_calls:
content_json["tool_calls"] = all_tool_calls
db = SessionLocal() db = SessionLocal()
try: try:

View File

@ -2,12 +2,13 @@
Supports Anthropic Claude API streaming and non-streaming responses. Supports Anthropic Claude API streaming and non-streaming responses.
""" """
import json import json
import logging import logging
from typing import Dict, List, Any, AsyncGenerator from typing import Dict, List, Any, AsyncGenerator
from .base import ProviderAdapter from .base import ProviderAdapter
from ..llm_response import ParsedDelta, LLMResponse from ..llm_response import ParsedDelta
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
@ -233,12 +234,12 @@ class AnthropicAdapter(ProviderAdapter):
# Tool use block start # Tool use block start
tool_index = chunk.get("index", 0) tool_index = chunk.get("index", 0)
tool_name = block.get("name", "") tool_name = block.get("name", "")
result.tool_calls = [{ result.tool_call = {
"index": tool_index, "index": tool_index,
"id": "", "id": "",
"type": "function", "type": "function",
"function": {"name": tool_name, "arguments": ""} "function": {"name": tool_name, "arguments": ""}
}] }
elif block_type == self.SUBTYPE_TEXT: elif block_type == self.SUBTYPE_TEXT:
# Text block start - nothing to output yet # Text block start - nothing to output yet
@ -262,13 +263,11 @@ class AnthropicAdapter(ProviderAdapter):
elif delta_type == self.DELTA_INPUT_JSON: elif delta_type == self.DELTA_INPUT_JSON:
# Tool arguments delta (incremental) # Tool arguments delta (incremental)
partial_json = delta.get("partial_json", "") partial_json = delta.get("partial_json", "")
# For tool calls, we need to update the arguments
# This is handled by the consumer (AgenticLoop)
if partial_json: if partial_json:
result.tool_calls = [{ result.tool_call = {
"index": 0, "index": 0,
"function": {"arguments": partial_json} "function": {"arguments": partial_json}
}] }
elif chunk_type == self.BLOCK_CONTENT_BLOCK_STOP: elif chunk_type == self.BLOCK_CONTENT_BLOCK_STOP:
# Content block stop # Content block stop
@ -297,7 +296,7 @@ class AnthropicAdapter(ProviderAdapter):
if result.has_content() or result.is_complete: if result.has_content() or result.is_complete:
yield result yield result
def parse_response(self, data: Dict[str, Any]) -> LLMResponse: def parse_response(self, data: Dict[str, Any]) -> Dict:
"""Parse non-streaming response""" """Parse non-streaming response"""
content = data.get("content", []) content = data.get("content", [])
thinking = "" thinking = ""
@ -321,16 +320,19 @@ class AnthropicAdapter(ProviderAdapter):
usage = data.get("usage", {}) usage = data.get("usage", {})
return LLMResponse( return {
content=text_content, "content": text_content,
thinking=thinking, "thinking": thinking,
tool_calls=tool_calls, "tool_calls": tool_calls,
usage={ "usage": {
"prompt_tokens": usage.get("input_tokens", 0), "prompt_tokens": usage.get("input_tokens", 0),
"completion_tokens": usage.get("output_tokens", 0), "completion_tokens": usage.get("output_tokens", 0),
"total_tokens": usage.get("input_tokens", 0) + usage.get("output_tokens", 0) "total_tokens": usage.get("input_tokens", 0) + usage.get("output_tokens", 0)
} }
) }
def supports_thinking(self) -> bool: def supports_thinking(self) -> bool:
return True return True
def supports_tools(self) -> bool:
return True

View File

@ -1,200 +1,86 @@
"""OpenAI Adapter - OpenAI-compatible API adapter """OpenAI Adapter - OpenAI/DeepSeek/GLM/MiniMax compatible API adapter"""
Supports OpenAI, DeepSeek, GLM and other OpenAI-compatible APIs.
"""
import json import json
import logging import logging
from typing import Dict, List, Any, AsyncGenerator, Optional from typing import Dict, List, Any, AsyncGenerator
from .base import ProviderAdapter from .base import ProviderAdapter
from ..llm_response import ParsedDelta, LLMResponse from ..llm_response import ParsedDelta
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
class OpenAIAdapter(ProviderAdapter): class OpenAIAdapter(ProviderAdapter):
"""OpenAI-compatible API adapter """OpenAI-compatible API adapter"""
Pure parsing adapter - no internal state management. def __init__(self):
Each parse_stream_chunk call returns incremental content. pass
Accumulation is handled by the consumer (AgenticLoop).
"""
@property @property
def provider_type(self) -> str: def provider_type(self) -> str:
return "openai" return "openai"
def __init__(self): def build_request(self, model: str, messages: List[Dict], tools=None, **kwargs) -> tuple:
pass
def build_request(
self,
model: str,
messages: List[Dict[str, Any]],
tools: List[Dict[str, Any]] = None,
**kwargs
) -> tuple[Dict[str, Any], Dict[str, str]]:
"""Build OpenAI-format request"""
api_key = kwargs.get("api_key", "") api_key = kwargs.get("api_key", "")
headers = {"Content-Type": "application/json", "Authorization": f"Bearer {api_key}"}
headers = { body = {"model": model, "messages": messages, "stream": kwargs.get("stream", True)}
"Content-Type": "application/json",
"Authorization": f"Bearer {api_key}"
}
body = {
"model": model,
"messages": messages,
"stream": kwargs.get("stream", True)
}
# Optional parameters
if "temperature" in kwargs: if "temperature" in kwargs:
body["temperature"] = kwargs["temperature"] body["temperature"] = kwargs["temperature"]
if "max_tokens" in kwargs: if "max_tokens" in kwargs:
body["max_tokens"] = kwargs["max_tokens"] body["max_tokens"] = kwargs["max_tokens"]
if "top_p" in kwargs:
body["top_p"] = kwargs["top_p"]
if "frequency_penalty" in kwargs:
body["frequency_penalty"] = kwargs["frequency_penalty"]
if "presence_penalty" in kwargs:
body["presence_penalty"] = kwargs["presence_penalty"]
if "stop" in kwargs:
body["stop"] = kwargs["stop"]
if tools: if tools:
body["tools"] = tools body["tools"] = tools
if kwargs.get("thinking_enabled"): body["tool_choice"] = "auto"
body["thinking_enabled"] = True
return body, headers return body, headers
def reset(self): def reset(self):
"""No-op for pure parsing adapter"""
pass pass
async def parse_stream_chunk( async def parse_stream_chunk(self, raw_chunk: str) -> AsyncGenerator[ParsedDelta, None]:
self, """Parse OpenAI/MiniMax format. Returns raw content for accumulation."""
raw_chunk: str if not raw_chunk or not raw_chunk.strip():
) -> AsyncGenerator[ParsedDelta, None]: return
"""Parse OpenAI-format SSE stream
Returns incremental content - no accumulation. chunk_str = raw_chunk.strip()
""" if chunk_str.startswith("data: "):
# Parse SSE line chunk_str = chunk_str[6:]
event_type, data_str = self._parse_sse_line(raw_chunk) elif chunk_str.startswith("data:"):
chunk_str = chunk_str[5:]
if not data_str or data_str == "[DONE]": if chunk_str.strip() == "[DONE]":
if data_str == "[DONE]": yield ParsedDelta(is_complete=True)
yield ParsedDelta(is_complete=True)
return return
try: try:
chunk = json.loads(data_str) chunk = json.loads(chunk_str)
except json.JSONDecodeError: except json.JSONDecodeError:
return return
# Handle errors choices = chunk.get("choices", [])
if event_type == "error" or "error" in chunk: if not choices:
yield ParsedDelta()
return return
# Extract usage delta = choices[0].get("delta", {})
usage = chunk.get("usage", {}) finish_reason = choices[0].get("finish_reason")
content = delta.get("content", "")
# Parse choices
for choice in chunk.get("choices", []):
delta = choice.get("delta", {})
content = delta.get("content") or ""
# Extract thinking tags if present
thinking, clean_text = self._extract_tags(content)
# Tool calls
tool_calls = delta.get("tool_calls", [])
# Check if this is the final delta
is_complete = bool(choice.get("finish_reason"))
if thinking or clean_text or tool_calls or is_complete or usage:
yield ParsedDelta(
thinking=thinking,
text=clean_text,
tool_calls=tool_calls if tool_calls else [],
is_complete=is_complete,
usage=usage if usage else {}
)
def parse_response(self, data: Dict[str, Any]) -> LLMResponse:
"""Parse non-streaming response"""
choice = data.get("choices", [{}])[0]
message = choice.get("message", {})
content = message.get("content", "") or ""
thinking, clean_content = self._extract_tags(content)
if not thinking:
thinking = message.get("reasoning_content") or ""
tool_calls = message.get("tool_calls", [])
usage = data.get("usage", {})
return LLMResponse(
content=clean_content,
thinking=thinking,
tool_calls=tool_calls,
usage=usage
)
def _parse_sse_line(self, line: str) -> tuple:
"""Parse a single SSE line, return (event_type, data)"""
if line.startswith("event:"):
return line[6:].strip(), None
elif line.startswith("data:"):
return "", line[5:].strip()
return "", None
def _extract_tags(self, content: str) -> tuple:
"""Extract thinking tags and return (thinking, clean_text)
Handles thinking tags that may be split across chunks:
- First </think> in content closes any thinking block
- Everything before first </think> is thinking
- Everything after first </think> is clean text
"""
if not content: if not content:
return "", "" if finish_reason is not None:
yield ParsedDelta(is_complete=True)
return
content_lower = content.lower() yield ParsedDelta(content=content)
# Find first </think> (marks end of thinking block) def parse_response(self, data: Dict) -> Dict:
end_idx = content_lower.find("</think>") """Parse non-streaming response."""
choices = data.get("choices", [])
if not choices:
return {"content": "", "tool_calls": [], "usage": {}}
message = choices[0].get("message", {})
content = message.get("content", "")
tool_calls = message.get("tool_calls", [])
usage = data.get("usage", {})
return {"content": content, "tool_calls": tool_calls, "usage": usage}
if end_idx != -1: def supports_tools(self) -> bool:
# Found end tag - split at this point return True
thinking_content = content[:end_idx].strip()
# Find if there's also a start tag before this
start_idx = content_lower.rfind("<think>", 0, end_idx)
if start_idx != -1:
# There's a complete thinking block
thinking = content[start_idx + 7:end_idx]
clean = content[end_idx + 9:]
else:
# No start tag - this is the end of a split thinking block
# Everything before </think> was thinking
thinking = content[:end_idx]
clean = content[end_idx + 9:]
return thinking, clean
# No end tag found
# Check if there's a start tag
start_idx = content_lower.find("<think>")
if start_idx != -1:
# Has start tag but no end - all content after start is thinking
thinking = content[start_idx + 7:]
return thinking, ""
else:
# No tags at all - everything is clean
return "", content

View File

@ -17,7 +17,7 @@ Usage:
# Streaming call # Streaming call
async for delta in client.stream_call(model, messages, tools=tools): async for delta in client.stream_call(model, messages, tools=tools):
print(delta.text, delta.thinking, delta.tool_calls) print(delta.text, delta.thinking, delta.tool_call)
""" """
import json import json
import logging import logging
@ -32,7 +32,7 @@ from luxx.services.llm_adapters import (
OpenAIAdapter, OpenAIAdapter,
AnthropicAdapter, AnthropicAdapter,
) )
from luxx.services.llm_response import ParsedDelta, LLMResponse from luxx.services.llm_response import ParsedDelta
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
@ -160,7 +160,7 @@ class LLMClient:
messages: List[Dict[str, Any]], messages: List[Dict[str, Any]],
tools: List[Dict[str, Any]] = None, tools: List[Dict[str, Any]] = None,
**kwargs **kwargs
) -> LLMResponse: ) -> Dict:
"""Synchronous call to LLM (non-streaming) """Synchronous call to LLM (non-streaming)
Args: Args:
@ -170,7 +170,7 @@ class LLMClient:
**kwargs: Other parameters (temperature, max_tokens, thinking_enabled, etc.) **kwargs: Other parameters (temperature, max_tokens, thinking_enabled, etc.)
Returns: Returns:
LLMResponse object Dict with keys: content, thinking, tool_calls, usage
""" """
import asyncio import asyncio
return asyncio.get_event_loop().run_until_complete( return asyncio.get_event_loop().run_until_complete(
@ -183,7 +183,7 @@ class LLMClient:
messages: List[Dict[str, Any]], messages: List[Dict[str, Any]],
tools: List[Dict[str, Any]] = None, tools: List[Dict[str, Any]] = None,
**kwargs **kwargs
) -> LLMResponse: ) -> Dict:
"""Internal async sync call""" """Internal async sync call"""
model = model or self.default_model model = model or self.default_model
kwargs["api_key"] = self.api_key kwargs["api_key"] = self.api_key
@ -259,9 +259,14 @@ class LLMClient:
response.raise_for_status() response.raise_for_status()
async for line in response.aiter_lines(): async for line in response.aiter_lines():
if line.strip(): # MiniMax may send multiple SSE events concatenated on one line
async for delta in self.adapter.parse_stream_chunk(line): # Format: data: {...}\ndata: {...}\n
yield delta parts = line.split("data: ")
for part in parts:
part = part.strip()
if part and part != "[DONE]" and part.startswith("{"):
async for delta in self.adapter.parse_stream_chunk("data: " + part):
yield delta
except httpx.HTTPStatusError as e: except httpx.HTTPStatusError as e:
status_code = e.response.status_code if e.response else "?" status_code = e.response.status_code if e.response else "?"

View File

@ -1,65 +1,60 @@
"""LLM Response - Unified message classes for LLM communication """LLM Response - Unified message classes for LLM communication"""
This module provides unified data classes for message passing throughout the LLM pipeline.
"""
from typing import Dict, Any, List, Optional
from dataclasses import dataclass, field from dataclasses import dataclass, field
from typing import Dict, Optional
class StepType:
"""Step type constants"""
THINKING = "thinking"
TEXT = "text"
TOOL_CALL = "tool_call"
TOOL_RESULT = "tool_result"
@dataclass
class Step:
"""Single step - used for storage and transport"""
id: str
index: int
type: str
content: str = ""
name: str = ""
arguments: str = ""
id_ref: str = ""
success: bool = True
def to_dict(self) -> Dict:
return {
"id": self.id,
"index": self.index,
"type": self.type,
"content": self.content,
"name": self.name,
"arguments": self.arguments,
"id_ref": self.id_ref,
"success": self.success
}
@dataclass @dataclass
class ParsedDelta: class ParsedDelta:
"""Streaming response delta """LLM streaming response delta"""
content: str = ""
Represents a single unit of streaming response data.
Used for streaming responses where content is accumulated incrementally.
Attributes:
thinking: Accumulated thinking/reasoning content
text: Accumulated text content
tool_calls: List of tool call requests
is_complete: Whether this is the final delta
usage: Token usage statistics
"""
thinking: str = "" thinking: str = ""
text: str = "" text: str = ""
tool_calls: List[Dict] = field(default_factory=list) tool_call: Optional[Dict] = None
is_complete: bool = False
usage: Dict[str, int] = field(default_factory=dict) usage: Dict[str, int] = field(default_factory=dict)
is_complete: bool = False
def has_thinking(self) -> bool: def has_thinking(self) -> bool:
"""Check if there's thinking content"""
return bool(self.thinking) return bool(self.thinking)
def has_text(self) -> bool: def has_text(self) -> bool:
"""Check if there's text content"""
return bool(self.text) return bool(self.text)
def has_tool_calls(self) -> bool: def has_tool_call(self) -> bool:
"""Check if there are tool calls""" return self.tool_call is not None
return bool(self.tool_calls)
def has_content(self) -> bool: def has_content(self) -> bool:
"""Check if there's any content""" return bool(self.content) or self.has_thinking() or self.has_text() or self.has_tool_call()
return self.has_thinking() or self.has_text() or self.has_tool_calls()
@dataclass
class LLMResponse:
"""Complete LLM response
Represents a complete non-streaming response.
Attributes:
content: Final text content
thinking: Final thinking content (if any)
tool_calls: List of tool calls (if any)
usage: Token usage statistics
"""
content: str = ""
thinking: str = ""
tool_calls: List[Dict] = field(default_factory=list)
usage: Dict[str, int] = field(default=dict)
def has_tool_calls(self) -> bool:
"""Check if there are tool calls"""
return bool(self.tool_calls)

View File

@ -1,37 +0,0 @@
"""ProcessResult - Result of processing an SSE line."""
class ProcessResult:
"""Result of processing an SSE line.
Attributes:
events: List of SSE event strings to yield
has_error: Whether an error occurred
error_content: Error message if any
has_content: Whether content was received
has_tool_calls: Whether tool calls were received
"""
def __init__(self):
self.events: list = []
self.has_error: bool = False
self.error_content: str = ""
self.has_content: bool = False
self.has_tool_calls: bool = False
def add_event(self, event: str):
"""Add an event to the result."""
self.events.append(event)
def set_error(self, content: str):
"""Set error state."""
self.has_error = True
self.error_content = content
def set_content(self):
"""Mark that content was received."""
self.has_content = True
def set_tool_calls(self):
"""Mark that tool calls were received."""
self.has_tool_calls = True

View File

@ -1,25 +1,19 @@
"""StreamContext - Manages streaming state transitions during LLM response. """StreamContext - Manages streaming state transitions during LLM response."""
Tracks steps in order:
- thinking: Model reasoning content
- text: Model response text
- tool_call: Tool invocation request
- tool_result: Tool execution result
Each step has unique id and index for frontend rendering.
"""
import json import json
from typing import List, Dict, Optional from typing import List, Dict, Optional
from luxx.services.llm_response import Step, StepType
THINK_START = "<think>"
THINK_END = "</think>"
def _sse_event(event: str, data: dict) -> str: def _sse_event(event: str, data: dict) -> str:
"""Format a Server-Sent Event string."""
return f"event: {event}\ndata: {json.dumps(data, ensure_ascii=False)}\n\n" return f"event: {event}\ndata: {json.dumps(data, ensure_ascii=False)}\n\n"
class StreamContext: class StreamContext:
"""Manages streaming state transitions during LLM response."""
def __init__(self): def __init__(self):
self.step_index = 0 self.step_index = 0
self.current_step_id = None self.current_step_id = None
@ -27,25 +21,95 @@ class StreamContext:
self.current_step_type = None self.current_step_type = None
self.full_content = "" self.full_content = ""
self.full_thinking = "" self.full_thinking = ""
self.all_steps = [] self.all_steps: List[Step] = []
self.all_tool_calls = [] self.all_tool_results: List[Dict] = []
self.all_tool_results = [] self.tool_calls_list: List[Dict] = []
self.tool_calls_list = []
self._last_message_id = None self._last_message_id = None
self._last_token_count = 0 self._last_token_count = 0
self._last_usage = None self._last_usage = None
self._in_thinking = False
self._thinking_buf = ""
self._text_buf = ""
def reset(self): def reset(self):
"""Reset state for new iteration."""
self.current_step_id = None self.current_step_id = None
self.current_step_idx = None self.current_step_idx = None
self.current_step_type = None self.current_step_type = None
self.full_content = "" self.full_content = ""
self.full_thinking = "" self.full_thinking = ""
self.tool_calls_list = [] self.tool_calls_list = []
self._in_thinking = False
self._thinking_buf = ""
self._text_buf = ""
def process_content(self, content: str) -> Dict:
"""Process raw content, handling thinking tags.
Returns dict with:
- thinking: accumulated thinking content (when thinking block ends)
- text: accumulated text content (when thinking block ends)
- should_emit: whether to emit a step
- thinking_only: whether only thinking was found (no text yet)
"""
if not content:
return {"thinking": "", "text": "", "should_emit": False, "thinking_only": False}
thinking = ""
text = ""
should_emit = False
thinking_only = False
# Check for thinking start
if THINK_START in content and not self._in_thinking:
self._in_thinking = True
idx = content.find(THINK_START) + len(THINK_START)
content = content[idx:]
# Check for thinking end
if THINK_END in content:
idx = content.find(THINK_END)
# Extract thinking content
thinking_content = content[:idx]
self._thinking_buf += thinking_content
# Extract text after first</think>
content = content[idx + len(THINK_END):]
# Look for second</think> (MiniMax format: </think> 正文 </think> 正文)
if THINK_END in content:
second_idx = content.find(THINK_END)
text_content = content[:second_idx]
self._text_buf += text_content
content = content[second_idx + len(THINK_END):]
self._in_thinking = False
should_emit = True
thinking_only = not bool(self._text_buf)
# Accumulate to buffers
if self._in_thinking:
self._thinking_buf += content
else:
self._text_buf += content
if should_emit:
thinking = self._thinking_buf
text = self._text_buf
return {
"thinking": thinking,
"text": text,
"should_emit": should_emit,
"thinking_only": thinking_only
}
def flush(self):
thinking = self._thinking_buf
text = self._text_buf
self._thinking_buf = ""
self._text_buf = ""
return thinking, text
def start_step(self, step_type: str) -> str: def start_step(self, step_type: str) -> str:
"""Start a new step with unique ID."""
self.current_step_idx = self.step_index self.current_step_idx = self.step_index
self.current_step_id = f"step-{self.step_index}" self.current_step_id = f"step-{self.step_index}"
self.current_step_type = step_type self.current_step_type = step_type
@ -53,20 +117,18 @@ class StreamContext:
return self.current_step_id return self.current_step_id
def finalize_step(self): def finalize_step(self):
"""Save current step to all_steps."""
if self.current_step_id is None: if self.current_step_id is None:
return return
content = self.full_content if self.current_step_type == StepType.TEXT else self.full_thinking
content = self.full_content if self.current_step_type == "text" else self.full_thinking step = Step(
self.all_steps.append({ id=self.current_step_id,
"id": self.current_step_id, index=self.current_step_idx,
"index": self.current_step_idx, type=self.current_step_type,
"type": self.current_step_type, content=content
"content": content )
}) self.all_steps.append(step)
def accumulate_tool_call(self, tc_delta: Dict): def accumulate_tool_call(self, tc_delta: Dict):
"""Accumulate tool call delta."""
idx = tc_delta.get("index", 0) idx = tc_delta.get("index", 0)
if idx >= len(self.tool_calls_list): if idx >= len(self.tool_calls_list):
self.tool_calls_list.append({ self.tool_calls_list.append({
@ -74,7 +136,6 @@ class StreamContext:
"type": "function", "type": "function",
"function": {"name": "", "arguments": ""} "function": {"name": "", "arguments": ""}
}) })
func = tc_delta.get("function", {}) func = tc_delta.get("function", {})
if func.get("name"): if func.get("name"):
self.tool_calls_list[idx]["function"]["name"] += func["name"] self.tool_calls_list[idx]["function"]["name"] += func["name"]
@ -82,31 +143,25 @@ class StreamContext:
self.tool_calls_list[idx]["function"]["arguments"] += func["arguments"] self.tool_calls_list[idx]["function"]["arguments"] += func["arguments"]
def emit_tool_calls(self) -> List[str]: def emit_tool_calls(self) -> List[str]:
"""Emit tool call steps, return SSE events."""
events = [] events = []
for tc in self.tool_calls_list: for tc in self.tool_calls_list:
step_id = f"step-{self.step_index}" step_id = f"step-{self.step_index}"
self.step_index += 1 self.step_index += 1
step = Step(
step = { id=step_id,
"id": step_id, index=self.step_index - 1,
"index": self.step_index - 1, type=StepType.TOOL_CALL,
"type": "tool_call", name=tc["function"]["name"],
"id_ref": tc.get("id", ""), arguments=tc["function"]["arguments"],
"name": tc["function"]["name"], id_ref=tc.get("id", "")
"arguments": tc["function"]["arguments"] )
}
self.all_steps.append(step) self.all_steps.append(step)
self.all_tool_calls.append(tc) events.append(_sse_event("process_step", {"step": step.to_dict()}))
events.append(_sse_event("process_step", {"step": step}))
return events return events
def emit_tool_result(self, result: Dict, ref_step_id: str) -> tuple: def emit_tool_result(self, result: Dict, ref_step_id: str) -> tuple:
"""Emit tool result step, return (step, event)."""
step_id = f"step-{self.step_index}" step_id = f"step-{self.step_index}"
self.step_index += 1 self.step_index += 1
content = result.get("content", "") content = result.get("content", "")
success = True success = True
try: try:
@ -115,33 +170,45 @@ class StreamContext:
success = parsed.get("success", True) success = parsed.get("success", True)
except (json.JSONDecodeError, TypeError): except (json.JSONDecodeError, TypeError):
pass pass
step = Step(
step = { id=step_id,
"id": step_id, index=self.step_index - 1,
"index": self.step_index - 1, type=StepType.TOOL_RESULT,
"type": "tool_result", name=result.get("name", ""),
"id_ref": ref_step_id, content=content,
"name": result.get("name", ""), id_ref=ref_step_id,
"content": content, success=success
"success": success )
}
self.all_steps.append(step) self.all_steps.append(step)
self.all_tool_results.append({ self.all_tool_results.append({
"role": "tool", "role": "tool",
"tool_call_id": result.get("tool_call_id", ""), "tool_call_id": result.get("tool_call_id", ""),
"content": content "content": content
}) })
return step, _sse_event("process_step", {"step": step.to_dict()})
return step, _sse_event("process_step", {"step": step}) def emit_thinking(self) -> str:
step = Step(
id=self.current_step_id,
index=self.current_step_idx,
type=StepType.THINKING,
content=self.full_thinking
)
return _sse_event("process_step", {"step": step.to_dict()})
def emit_text(self) -> str:
step = Step(
id=self.current_step_id,
index=self.current_step_idx,
type=StepType.TEXT,
content=self.full_content
)
return _sse_event("process_step", {"step": step.to_dict()})
def set_completion(self, msg_id: str, token_count: int, usage: dict): def set_completion(self, msg_id: str, token_count: int, usage: dict):
"""Set completion info for saving."""
self._last_message_id = msg_id self._last_message_id = msg_id
self._last_token_count = token_count self._last_token_count = token_count
self._last_usage = usage self._last_usage = usage
def reset_completion(self): def get_steps_for_save(self) -> List[Dict]:
"""Reset completion info.""" return [step.to_dict() for step in self.all_steps]
self._last_message_id = None
self._last_token_count = 0
self._last_usage = None