feat: 🏗️ 实现 Agent 消息可靠异步持久化(Outbox + Kafka) * 新增 Outbox 数据模型与消息载荷定义,位于 `backend/model/outbox.go` * 新增 Outbox DAO,支持创建、扫描、发布标记、失败重试与消费落库事务,位于 `backend/dao/outbox.go` * 新增 Kafka 基础封装,包含配置、生产者、消费者与消息包装,位于 `backend/kafka` 文件夹 * `config.go`:Kafka 配置文件 * `producer.go`:Kafka 生产者 * `consumer.go`:Kafka 消费者 * `envelope.go`:消息封装处理 * 新增异步管道服务,处理扫描投递与消费落库,位于 `backend/service/agent_async_pipeline.go` * 接入 Agent 聊天链路的可靠持久化,替换原有 goroutine 直接写库逻辑,位于 `backend/service/agent.go` * 启动流程接入管道初始化与启动,位于 `backend/cmd/start.go` * 增加 Kafka 配置项,更新 `backend/config.yaml` 与 `backend/config.example.yaml` * 引入 Kafka 依赖:`github.com/segmentio/kafka-go`(见 `backend/go.mod`, `backend/go.sum`) fix: 🐛 修复首启偶发 user 消息重复落库问题 * 解决因 Outbox 状态并发回写竞态,导致 `consumed` 被晚到的 `published` 覆盖的问题 * 在 `MarkPublished` 中增加条件,避免覆盖已标记为 `consumed` 或 `dead` 的消息,修复位置:`backend/dao/outbox.go` perf: ⚡ 更新 Docker Compose 配置与 Kafka 相关服务 * 更新 `docker-compose.yml` 文件,新增 Kafka 配置与服务 fix: 🧹 优化缓存删除逻辑 * 在 `cache deleter` 中忽略了 `model.AgentOutboxMessage`、`model.ChatHistory` 与 `model.AgentChat` 这三个结构体 * 防止这些结构体对应的表单删除缓存时,导致控制台消息爆炸
215 lines
5.8 KiB
Go
215 lines
5.8 KiB
Go
package service
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"errors"
|
|
"fmt"
|
|
"log"
|
|
"time"
|
|
|
|
"github.com/LoveLosita/smartflow/backend/dao"
|
|
kafkabus "github.com/LoveLosita/smartflow/backend/kafka"
|
|
"github.com/LoveLosita/smartflow/backend/model"
|
|
segmentkafka "github.com/segmentio/kafka-go"
|
|
"gorm.io/gorm"
|
|
)
|
|
|
|
// AgentAsyncPipeline 负责 outbox 扫描、Kafka 投递与消费落库。
|
|
type AgentAsyncPipeline struct {
|
|
outboxRepo *dao.OutboxDAO
|
|
producer *kafkabus.Producer
|
|
consumer *kafkabus.Consumer
|
|
topic string
|
|
maxRetry int
|
|
scanEvery time.Duration
|
|
scanBatch int
|
|
}
|
|
|
|
func NewAgentAsyncPipeline(outboxRepo *dao.OutboxDAO, cfg kafkabus.Config) (*AgentAsyncPipeline, error) {
|
|
if !cfg.Enabled {
|
|
return nil, nil
|
|
}
|
|
producer, err := kafkabus.NewProducer(cfg)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
consumer, err := kafkabus.NewConsumer(cfg)
|
|
if err != nil {
|
|
_ = producer.Close()
|
|
return nil, err
|
|
}
|
|
return &AgentAsyncPipeline{
|
|
outboxRepo: outboxRepo,
|
|
producer: producer,
|
|
consumer: consumer,
|
|
topic: cfg.Topic,
|
|
maxRetry: cfg.MaxRetry,
|
|
scanEvery: cfg.RetryScanInterval,
|
|
scanBatch: cfg.RetryBatchSize,
|
|
}, nil
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) Start(ctx context.Context) {
|
|
if p == nil {
|
|
return
|
|
}
|
|
go p.startDispatchLoop(ctx)
|
|
go p.startConsumeLoop(ctx)
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) Close() {
|
|
if p == nil {
|
|
return
|
|
}
|
|
if err := p.producer.Close(); err != nil {
|
|
log.Printf("关闭 Kafka producer 失败: %v", err)
|
|
}
|
|
if err := p.consumer.Close(); err != nil {
|
|
log.Printf("关闭 Kafka consumer 失败: %v", err)
|
|
}
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) EnqueueChatHistoryPersist(ctx context.Context, payload model.ChatHistoryPersistPayload) error {
|
|
if p == nil {
|
|
return errors.New("Kafka 异步链路未初始化")
|
|
}
|
|
outboxID, err := p.outboxRepo.CreateChatHistoryMessage(ctx, p.topic, payload.ConversationID, payload, p.maxRetry)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if err = p.dispatchOne(context.Background(), outboxID); err != nil {
|
|
log.Printf("outbox 消息 %d 首次投递失败,等待扫描重试: %v", outboxID, err)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) startDispatchLoop(ctx context.Context) {
|
|
ticker := time.NewTicker(p.scanEvery)
|
|
defer ticker.Stop()
|
|
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
case <-ticker.C:
|
|
pendingMessages, err := p.outboxRepo.ListDueMessages(ctx, p.scanBatch)
|
|
if err != nil {
|
|
log.Printf("扫描 outbox 失败: %v", err)
|
|
continue
|
|
}
|
|
for _, msg := range pendingMessages {
|
|
if err = p.dispatchOne(ctx, msg.ID); err != nil {
|
|
log.Printf("重试投递 outbox 消息失败(id=%d): %v", msg.ID, err)
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) dispatchOne(ctx context.Context, outboxID int64) error {
|
|
outboxMsg, err := p.outboxRepo.GetByID(ctx, outboxID)
|
|
if err != nil {
|
|
if errors.Is(err, gorm.ErrRecordNotFound) {
|
|
return nil
|
|
}
|
|
return err
|
|
}
|
|
if outboxMsg.Status == model.OutboxStatusConsumed || outboxMsg.Status == model.OutboxStatusDead {
|
|
return nil
|
|
}
|
|
|
|
envelope := kafkabus.Envelope{
|
|
OutboxID: outboxMsg.ID,
|
|
BizType: outboxMsg.BizType,
|
|
Payload: json.RawMessage(outboxMsg.Payload),
|
|
}
|
|
raw, err := json.Marshal(envelope)
|
|
if err != nil {
|
|
markErr := p.outboxRepo.MarkDead(ctx, outboxMsg.ID, "序列化 outbox 包裹失败: "+err.Error())
|
|
if markErr != nil {
|
|
log.Printf("标记 outbox 死信失败(id=%d): %v", outboxMsg.ID, markErr)
|
|
}
|
|
return err
|
|
}
|
|
|
|
if err = p.producer.Enqueue(ctx, outboxMsg.Topic, outboxMsg.MessageKey, raw); err != nil {
|
|
_ = p.outboxRepo.MarkFailedForRetry(ctx, outboxMsg.ID, "投递 Kafka 失败: "+err.Error())
|
|
return err
|
|
}
|
|
if err = p.outboxRepo.MarkPublished(ctx, outboxMsg.ID); err != nil {
|
|
_ = p.outboxRepo.MarkFailedForRetry(ctx, outboxMsg.ID, "更新已投递状态失败: "+err.Error())
|
|
return err
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) startConsumeLoop(ctx context.Context) {
|
|
for {
|
|
select {
|
|
case <-ctx.Done():
|
|
return
|
|
default:
|
|
}
|
|
|
|
msg, err := p.consumer.Dequeue(ctx)
|
|
if err != nil {
|
|
if errors.Is(err, context.Canceled) {
|
|
return
|
|
}
|
|
log.Printf("Kafka 消费拉取失败: %v", err)
|
|
time.Sleep(300 * time.Millisecond)
|
|
continue
|
|
}
|
|
if err = p.handleMessage(ctx, msg); err != nil {
|
|
log.Printf("处理 Kafka 消息失败(topic=%s, partition=%d, offset=%d): %v", msg.Topic, msg.Partition, msg.Offset, err)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) handleMessage(ctx context.Context, msg segmentkafka.Message) error {
|
|
var envelope kafkabus.Envelope
|
|
if err := json.Unmarshal(msg.Value, &envelope); err != nil {
|
|
_ = p.consumer.Commit(ctx, msg)
|
|
return fmt.Errorf("解析 Kafka 包裹失败: %w", err)
|
|
}
|
|
if envelope.OutboxID <= 0 {
|
|
_ = p.consumer.Commit(ctx, msg)
|
|
return errors.New("Kafka 包裹缺少 outbox_id")
|
|
}
|
|
|
|
switch envelope.BizType {
|
|
case model.OutboxBizTypeChatHistoryPersist:
|
|
return p.consumeChatHistory(ctx, msg, envelope)
|
|
default:
|
|
_ = p.outboxRepo.MarkDead(ctx, envelope.OutboxID, "未知业务类型: "+envelope.BizType)
|
|
if err := p.consumer.Commit(ctx, msg); err != nil {
|
|
return err
|
|
}
|
|
return nil
|
|
}
|
|
}
|
|
|
|
func (p *AgentAsyncPipeline) consumeChatHistory(ctx context.Context, msg segmentkafka.Message, envelope kafkabus.Envelope) error {
|
|
var payload model.ChatHistoryPersistPayload
|
|
if err := json.Unmarshal(envelope.Payload, &payload); err != nil {
|
|
_ = p.outboxRepo.MarkDead(ctx, envelope.OutboxID, "解析聊天持久化载荷失败: "+err.Error())
|
|
if commitErr := p.consumer.Commit(ctx, msg); commitErr != nil {
|
|
return commitErr
|
|
}
|
|
return nil
|
|
}
|
|
|
|
if err := p.outboxRepo.PersistChatHistoryAndMarkConsumed(ctx, envelope.OutboxID, payload); err != nil {
|
|
if markErr := p.outboxRepo.MarkFailedForRetry(ctx, envelope.OutboxID, "消费并落库失败: "+err.Error()); markErr != nil {
|
|
return markErr
|
|
}
|
|
if commitErr := p.consumer.Commit(ctx, msg); commitErr != nil {
|
|
return commitErr
|
|
}
|
|
return err
|
|
}
|
|
|
|
return p.consumer.Commit(ctx, msg)
|
|
}
|