使用Go语言实现ReAct模型

ReAct 框架是一个结合了推理和行动的通用范例，通过交错生成推理轨迹和任务特定操作，使 LLM (大型语言模型) 能够与外部工具交互来获取额外信息，从而给出更可靠和实际的回应。

核心架构设计

ReAct 模型的核心是思考(Reasoning)→ 行动(Action)→ 观察(Observation)的循环机制。使用 Go 语言实现这一架构时，我们可以设计以下核心组件:

1
type ReactAgent struct {
2
    llm         LLMClient
3
    tools       []Tool
4
    context     *Context
5
    maxTurns    int
6
    prompter    Prompter
7
}

1. 主循环设计

Go 语言的强类型特性和简洁的并发模型非常适合实现 ReAct 的主循环：

1
// Process runs the ReAct loop for userInput and returns the final answer.
//
// Each turn generates a reasoning step and records it. If the step asks for
// a tool, the tool is executed and its output is stored as the observation;
// otherwise the step is searched for a final answer, and the first non-empty
// one is returned. A reasoning failure aborts with a wrapped error. When
// maxTurns is exhausted without an answer, the fallback response is returned.
//
// Process replaces agent.context on every call, so concurrent calls on the
// same agent would overwrite each other's state.
func (agent *ReactAgent) Process(userInput string) (string, error) {
	agent.context = NewContext(userInput)

	for turn := 0; turn < agent.maxTurns; turn++ {
		// 1. Reasoning phase.
		reasoning, err := agent.generateReasoning()
		if err != nil {
			return "", fmt.Errorf("推理生成失败: %w", err)
		}
		agent.context.AddReasoning(reasoning)

		// 2. Answer phase: no tool requested, so look for a final answer.
		if !agent.isActionRequired(reasoning) {
			if answer := agent.extractFinalAnswer(reasoning); answer != "" {
				return answer, nil
			}
			continue
		}

		// 3. Action phase: record the requested call, run it, store the result.
		name, params := agent.extractAction(reasoning)
		agent.context.SetAction(name, params)
		agent.context.AddObservation(agent.executeAction(name, params))
	}

	// Turn budget exhausted without a final answer.
	return agent.generateFallbackResponse(), nil
}

这个主循环设计遵循 ReAct 的核心理念：

迭代式推理：通过多轮交互不断完善思考
工具调用：基于推理结果决定是否调用外部工具
观察反馈：将工具执行结果纳入上下文，用于后续推理

2. 提示(Prompts)设计

有效的提示设计是 ReAct 成功的关键。我们可以创建一个专用的 Prompter 接口：

1
type Prompter interface {
2
    GeneratePrompt(context *Context, tools []Tool) string
3
}
4

5
// DefaultPrompter is a Prompter backed by a text template.
type DefaultPrompter struct {
	template string // template source, parsed on every GeneratePrompt call
}
8

9
func (p *DefaultPrompter) GeneratePrompt(context *Context, tools []Tool) string {
10
    // 实现提示模板的渲染逻辑
11
    tmpl, _ := template.New("prompt").Parse(p.template)
12
    var buf bytes.Buffer
13

14
    data := map[string]interface{}{
15
        "Tools":         tools,
16
        "UserInput":     context.UserInput,
17
        "HistoryExists": len(context.History) > 0,
18
        "History":       context.History,
19
    }
20

21
    tmpl.Execute(&buf, data)
22
    return buf.String()
23
}

ReAct 提示模板示例：

1
您是一个能够思考和行动的AI助手。请按照以下格式回答问题:

思考：请分析问题并思考解决方案。将复杂问题分解为子步骤并展示您的推理过程。

行动：[工具名称]([参数])
可用工具:
{{range .Tools}}
- {{.Name}}: {{.Description}}
  参数: {{.Parameters}}
{{end}}

观察：[工具执行的结果将显示在这里]

回答：[收集足够信息后] 提供最终完整答案。

用户问题: {{.UserInput}}

{{if .HistoryExists}}
历史交互:
{{range .History}}
思考: {{.Reasoning}}
{{if .ActionPerformed}}
行动: {{.ActionName}}({{.ActionParams}})
观察: {{.Observation}}
{{end}}
{{end}}
{{end}}

请开始您的思考:

这种提示设计：

明确格式要求：清晰定义了“思考”、“行动”和“观察”的格式规范
工具说明：动态列出可用工具及其参数要求
历史记忆：包含之前所有交互记录，建立持续对话能力
引导式生成：引导 LLM 按照 ReAct 范式进行输出

3. 工具集成设计

Go 语言的接口特性很适合设计灵活的工具系统：

1
// Tool is an external capability the agent can invoke.
type Tool interface {
	// Name returns the identifier of the tool.
	Name() string
	// Description returns a human-readable summary of the tool.
	Description() string
	// Parameters returns a description of the parameters the tool expects.
	Parameters() string
	// Execute runs the tool on the given parameter string and returns its output.
	Execute(params string) string
}
8

9
// SearchTool is the web-search tool. Execute is still a placeholder, so the
// struct fields are not read by any method in this block.
type SearchTool struct {
	apiClient *http.Client
	apiKey    string
}

// Name returns the tool identifier "search".
func (t *SearchTool) Name() string { return "search" }

// Description returns the summary shown for this tool.
func (t *SearchTool) Description() string { return "在网络上搜索最新信息" }

// Parameters describes the single expected argument: the search query.
func (t *SearchTool) Parameters() string { return "搜索查询(string)" }

// Execute is a placeholder: it ignores params and returns a fixed string.
func (t *SearchTool) Execute(params string) string {
	// TODO: call the search API.
	return "搜索结果..."
}
31

32
// CalculatorTool is the math-evaluation tool. Execute is still a placeholder.
type CalculatorTool struct{}

// Name returns the tool identifier "calculator".
func (t *CalculatorTool) Name() string { return "calculator" }

// Description returns the summary shown for this tool.
func (t *CalculatorTool) Description() string { return "执行数学计算" }

// Parameters describes the single expected argument: a math expression.
func (t *CalculatorTool) Parameters() string { return "数学表达式(string)" }

// Execute is a placeholder: it ignores params and returns a fixed string.
func (t *CalculatorTool) Execute(params string) string {
	// TODO: evaluate the expression.
	return "计算结果..."
}

工具调用的辅助函数：

1
func (agent *ReactAgent) executeAction(name string, params string) string {
2
    tool := agent.findTool(name)
3
    if tool == nil {
4
        return fmt.Sprintf("错误: 未找到工具 '%s'", name)
5
    }
6

7
    // 可添加超时控制和错误处理
8
    ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
9
    defer cancel()
10

11
    resultCh := make(chan string, 1)
12
    errCh := make(chan error, 1)
13

14
    go func() {
15
        defer func() {
16
            if r := recover(); r != nil {
17
                errCh <- fmt.Errorf("工具执行崩溃: %v", r)
18
            }
19
        }()
20

21
        result := tool.Execute(params)
22
        resultCh <- result
23
    }()
24

25
    select {
26
    case result := <-resultCh:
27
        return result
28
    case err := <-errCh:
29
        return fmt.Sprintf("工具执行错误: %v", err)
30
    case <-ctx.Done():
31
        return "工具执行超时"
32
    }
33
}

4. LLM 客户端集成

使用 Go 调用 LLM API 的接口设计：

1
// LLMClient is the text-generation backend used by the agent.
type LLMClient interface {
	// Generate sends prompt to the model and returns the generated text.
	Generate(prompt string) (string, error)
}
4

5
// OpenAIClient is an LLM client for an OpenAI-style chat completions endpoint.
type OpenAIClient struct {
	client  *http.Client // HTTP client used for every request
	apiKey  string       // sent as the Bearer token
	model   string       // model name placed in the request body
	baseURL string       // full URL of the completions endpoint
}
12

13
func NewOpenAIClient(apiKey, model string) *OpenAIClient {
14
    return &OpenAIClient{
15
        client:  &http.Client{Timeout: 30 * time.Second},
16
        apiKey:  apiKey,
17
        model:   model,
18
        baseURL: "https://api.openai.com/v1/chat/completions",
19
    }
20
}
21

22
func (c *OpenAIClient) Generate(prompt string) (string, error) {
23
    // 构建请求体
24
    reqBody, _ := json.Marshal(map[string]interface{}{
25
        "model": c.model,
26
        "messages": []map[string]string{
27
            {"role": "user", "content": prompt},
28
        },
29
        "temperature": 0.7,
30
    })
31

32
    // 创建请求
33
    req, err := http.NewRequest("POST", c.baseURL, bytes.NewBuffer(reqBody))
34
    if err != nil {
35
        return "", err
36
    }
37

38
    // 设置请求头
39
    req.Header.Set("Content-Type", "application/json")
40
    req.Header.Set("Authorization", "Bearer "+c.apiKey)
41

42
    // 发送请求
43
    resp, err := c.client.Do(req)
44
    if err != nil {
45
        return "", err
46
    }
47
    defer resp.Body.Close()
48

49
    // 解析响应
50
    var result map[string]interface{}
51
    json.NewDecoder(resp.Body).Decode(&result)
52

53
    // 提取生成的文本
54
    choices, ok := result["choices"].([]interface{})
55
    if !ok || len(choices) == 0 {
56
        return "", fmt.Errorf("无效的API响应")
57
    }
58

59
    choice := choices[0].(map[string]interface{})
60
    message := choice["message"].(map[string]interface{})
61
    content := message["content"].(string)
62

63
    return content, nil
64
}

5. 上下文管理

设计上下文结构来维护交互历史：

1
// 上下文结构
2
type Context struct {
3
    UserInput string
4
    History   []Exchange
5
}
6

7
// Exchange records one loop iteration: the reasoning text and, when a tool
// was invoked, the action and its observation.
type Exchange struct {
	Reasoning       string // reasoning text for this step
	ActionPerformed bool   // set by Context.SetAction
	ActionName      string // tool name recorded by Context.SetAction
	ActionParams    string // tool parameters recorded by Context.SetAction
	Observation     string // tool output recorded by Context.AddObservation
}
15

16
func NewContext(userInput string) *Context {
17
    return &Context{
18
        UserInput: userInput,
19
        History:   []Exchange{},
20
    }
21
}
22

23
// 添加推理到上下文
24
func (c *Context) AddReasoning(reasoning string) {
25
    c.History = append(c.History, Exchange{
26
        Reasoning: reasoning,
27
    })
28
}
29

30
// 设置行动信息
31
func (c *Context) SetAction(name, params string) {
32
    lastIdx := len(c.History) - 1
33
    if lastIdx >= 0 {
34
        c.History[lastIdx].ActionPerformed = true
35
        c.History[lastIdx].ActionName = name
36
        c.History[lastIdx].ActionParams = params
37
    }
38
}
39

40
// 添加观察结果
41
func (c *Context) AddObservation(observation string) {
42
    lastIdx := len(c.History) - 1
43
    if lastIdx >= 0 {
44
        c.History[lastIdx].Observation = observation
45
    }
46
}
47

48
// 获取当前上下文的令牌估计数量
49
func (c *Context) EstimateTokens() int {
50
    // 简单估计：每4个字符约为1个token
51
    totalChars := len(c.UserInput)
52

53
    for _, exchange := range c.History {
54
        totalChars += len(exchange.Reasoning)
55
        totalChars += len(exchange.ActionName)
56
        totalChars += len(exchange.ActionParams)
57
        totalChars += len(exchange.Observation)
58
    }
59

60
    return totalChars / 4
61
}

6. 辅助解析函数

设计解析 LLM 输出的辅助函数：

1
// 解析行动
2
func (agent *ReactAgent) extractAction(reasoning string) (name string, params string) {
3
    // 使用正则表达式提取行动名称和参数
4
    actionRegex := regexp.MustCompile(`行动: (\w+)\((.+?)\)`)
5
    matches := actionRegex.FindStringSubmatch(reasoning)
6

7
    if len(matches) >= 3 {
8
        name = matches[1]
9
        params = matches[2]
10
    }
11

12
    return
13
}
14

15
// 判断是否需要执行工具
16
func (agent *ReactAgent) isActionRequired(reasoning string) bool {
17
    return strings.Contains(reasoning, "行动:") && !strings.Contains(reasoning, "回答:")
18
}
19

20
// 提取最终答案
21
func (agent *ReactAgent) extractFinalAnswer(reasoning string) string {
22
    answerRegex := regexp.MustCompile(`回答: ([\s\S]+)`)
23
    matches := answerRegex.FindStringSubmatch(reasoning)
24

25
    if len(matches) >= 2 {
26
        return matches[1]
27
    }
28

29
    return ""
30
}

7. 完整系统集成

主程序示例：

1
func main() {
2
    // 初始化LLM客户端
3
    llmClient := NewOpenAIClient(os.Getenv("OPENAI_API_KEY"), "gpt-4")
4

5
    // 初始化工具集
6
    tools := []Tool{
7
        &SearchTool{},
8
        &CalculatorTool{},
9
        &WeatherTool{},
10
        &DatabaseTool{},
11
    }
12

13
    // 创建默认提示器
14
    prompter := &DefaultPrompter{
15
        template: promptTemplate, // 上面定义的模板
16
    }
17

18
    // 创建ReAct代理
19
    agent := &ReactAgent{
20
        llm:      llmClient,
21
        tools:    tools,
22
        maxTurns: 5,
23
        prompter: prompter,
24
    }
25

26
    // 处理用户查询
27
    userInput := "中国和美国的时差是多少，并计算如果中国现在是下午3点，美国是几点？"
28
    result, err := agent.Process(userInput)
29
    if err != nil {
30
        fmt.Printf("错误: %v\n", err)
31
        return
32
    }
33

34
    fmt.Println("最终回答:", result)
35
}

8. Go 实现 ReAct 的优势与挑战

优势

并发处理能力：使用 goroutine 和 channel 可实现工具并行执行和超时控制

1
// 并行执行多个工具示例
2
func (agent *ReactAgent) executeParallelActions(actions []Action) []Observation {
3
    results := make([]Observation, len(actions))
4
    var wg sync.WaitGroup
5

6
    for i, action := range actions {
7
        wg.Add(1)
8
        go func(idx int, act Action) {
9
            defer wg.Done()
10
            tool := agent.findTool(act.Name)
11
            if tool == nil {
12
                results[idx] = Observation{Error: "工具不存在"}
13
                return
14
            }
15

16
            result := tool.Execute(act.Params)
17
            results[idx] = Observation{Result: result}
18
        }(i, action)
19
    }
20

21
    wg.Wait()
22
    return results
23
}

类型安全：Go 的静态类型系统有助于减少运行时错误
部署便利性：编译为单一二进制文件，无需依赖，易于部署和分发

性能优势：执行效率高，适合处理高并发请求

1
// 高性能HTTP服务器示例
2
func setupServer(agent *ReactAgent) *http.Server {
3
    router := mux.NewRouter()
4

5
    router.HandleFunc("/react", func(w http.ResponseWriter, r *http.Request) {
6
        if r.Method != "POST" {
7
            http.Error(w, "仅支持POST请求", http.StatusMethodNotAllowed)
8
            return
9
        }
10

11
        var request struct {
12
            Query string `json:"query"`
13
        }
14

15
        if err := json.NewDecoder(r.Body).Decode(&request); err != nil {
16
            http.Error(w, "无效的请求格式", http.StatusBadRequest)
17
            return
18
        }
19

20
        result, err := agent.Process(request.Query)
21
        if err != nil {
22
            http.Error(w, err.Error(), http.StatusInternalServerError)
23
            return
24
        }
25

26
        json.NewEncoder(w).Encode(map[string]string{"response": result})
27
    })
28

29
    return &http.Server{
30
        Addr:         ":8080",
31
        Handler:      router,
32
        ReadTimeout:  60 * time.Second,
33
        WriteTimeout: 60 * time.Second,
34
    }
35
}

良好的 AI 生态支持：langchaingo、go-openai 等库提供了可靠的基础设施

挑战

提示工程复杂性：设计稳定可靠的提示模板需要反复调优

1
// 可能的解决方案：提示模板变体测试
2
func benchmarkPromptTemplates(client LLMClient, testCases []string) map[string]TemplateMetrics {
3
    templates := map[string]string{
4
        "标准模板": standardTemplate,
5
        "详细模板": verboseTemplate,
6
        "简洁模板": conciseTemplate,
7
    }
8

9
    results := make(map[string]TemplateMetrics)
10

11
    for name, template := range templates {
12
        prompter := &DefaultPrompter{template: template}
13
        metrics := evaluateTemplate(client, prompter, testCases)
14
        results[name] = metrics
15
    }
16

17
    return results
18
}

LLM 输出解析不稳定：不同 LLM 模型可能有不同的输出格式

1
// 可能的解决方案：多模式解析
2
func (agent *ReactAgent) extractActionMultiMode(reasoning string) (name string, params string) {
3
    // 尝试多种格式匹配
4
    patterns := []string{
5
        `行动: (\w+)\((.+?)\)`,
6
        `行动：(\w+)\((.+?)\)`,
7
        `Action: (\w+)\((.+?)\)`,
8
        `使用工具 (\w+) 参数是 (.+)`,
9
    }
10

11
    for _, pattern := range patterns {
12
        regex := regexp.MustCompile(pattern)
13
        matches := regex.FindStringSubmatch(reasoning)
14
        if len(matches) >= 3 {
15
            return matches[1], matches[2]
16
        }
17
    }
18

19
    return "", ""
20
}

上下文管理：长对话可能导致上下文溢出

1
// 可能的解决方案：上下文压缩
2
func (c *Context) Compress(maxTokens int) {
3
    currentTokens := c.EstimateTokens()
4
    if currentTokens <= maxTokens {
5
        return
6
    }
7

8
    // 计算需要压缩的令牌数
9
    excessTokens := currentTokens - maxTokens
10

11
    // 从最早的交互开始压缩
12
    for i := 0; i < len(c.History) && excessTokens > 0; i++ {
13
        // 保留行动和观察，但压缩推理部分
14
        exchange := &c.History[i]
15

16
        // 估算当前推理的令牌数
17
        reasoningTokens := len(exchange.Reasoning) / 4
18

19
        if reasoningTokens > 50 { // 只压缩较长的推理
20
            // 压缩为摘要
21
            exchange.Reasoning = fmt.Sprintf(
22
                "推理摘要: 经考虑后%s使用工具%s并获得结果",
23
                exchange.ActionPerformed ? "决定" : "没有",
24
                exchange.ActionName,
25
            )
26

27
            // 更新节省的令牌数
28
            savedTokens := reasoningTokens - (len(exchange.Reasoning) / 4)
29
            excessTokens -= savedTokens
30
        }
31
    }
32
}

工具执行安全性：需要防止恶意指令和潜在安全风险

1
// SafetyManager validates tool calls before they are executed.
type SafetyManager struct {
	blockedPatterns  []string      // regular expressions that tool parameters must not match
	maxExecutionTime time.Duration // not read by ValidateAction
}
6

7
func (sm *SafetyManager) ValidateAction(name string, params string) error {
8
    // 检查工具名称是否在白名单中
9
    allowedTools := map[string]bool{
10
        "search": true,
11
        "calculator": true,
12
        "weather": true,
13
    }
14

15
    if !allowedTools[name] {
16
        return fmt.Errorf("未授权的工具: %s", name)
17
    }
18

19
    // 检查参数是否匹配阻止模式
20
    for _, pattern := range sm.blockedPatterns {
21
        if matched, _ := regexp.MatchString(pattern, params); matched {
22
            return fmt.Errorf("参数包含禁止内容")
23
        }
24
    }
25

26
    return nil
27
}

API 限制和费用：需要处理配额限制和成本控制

1
// TokenUsageTracker accumulates token usage per day and compares it with
// configured limits.
type TokenUsageTracker struct {
	mu         sync.Mutex     // guards the maps below
	usageByDay map[string]int // tokens used, keyed by date in YYYY-MM-DD form
	limits     map[string]int // token limit, looked up with the same date key
}
7

8
// TrackUsage adds tokens to today's usage and reports whether the total is
// still within today's limit.
//
// It returns (true, nil) when no limit is configured for today or the total
// does not exceed it, and (false, error) once the total exceeds the limit.
// The usage is recorded in both cases. A zero-value tracker is usable: the
// usage map is created on first use.
func (t *TokenUsageTracker) TrackUsage(tokens int) (bool, error) {
	t.mu.Lock()
	defer t.mu.Unlock()

	// Writing to a nil map panics, so create it lazily.
	if t.usageByDay == nil {
		t.usageByDay = make(map[string]int)
	}

	today := time.Now().Format("2006-01-02")
	t.usageByDay[today] += tokens

	if limit, exists := t.limits[today]; exists && t.usageByDay[today] > limit {
		return false, fmt.Errorf("超出每日令牌限额")
	}

	return true, nil
}

总结

Go 语言实现 ReAct 模型是一个理想的选择，其强类型、并发模型和性能特性非常适合构建可靠的 AI 代理系统。通过分离关注点（提示管理、工具执行、LLM 交互等），我们可以创建出一个灵活、可扩展且高性能的 ReAct 实现。

主要实施建议：

使用接口抽象关键组件，便于替换和测试
充分利用 Go 的并发特性处理工具执行
实现健壮的错误处理和超时控制
关注提示工程和输出解析的稳定性
设计有效的上下文管理策略

通过这种架构，开发者可以构建出能够结合推理和行动能力的强大 AI 应用，同时充分利用 Go 语言的优势。