Spaces:
Sleeping
Sleeping
package monica | |
import ( | |
"bufio" | |
"bytes" | |
"fmt" | |
"io" | |
"sync" | |
"time" | |
"monica-proxy/internal/types" | |
"monica-proxy/internal/utils" | |
"net/http" | |
"strings" | |
"github.com/bytedance/sonic" | |
"github.com/sashabaranov/go-openai" | |
) | |
const ( | |
sseObject = "chat.completion.chunk" | |
sseFinish = "[DONE]" | |
flushInterval = 100 * time.Millisecond // 刷新间隔 | |
bufferSize = 4096 // 缓冲区大小 | |
dataPrefix = "data: " | |
dataPrefixLen = len(dataPrefix) | |
lineEnd = "\n\n" | |
) | |
// SSEData 用于解析 Monica SSE json | |
type SSEData struct { | |
Text string `json:"text"` | |
Finished bool `json:"finished"` | |
AgentStatus AgentStatus `json:"agent_status,omitempty"` | |
} | |
type AgentStatus struct { | |
UID string `json:"uid"` | |
Type string `json:"type"` | |
Text string `json:"text"` | |
Metadata struct { | |
Title string `json:"title"` | |
ReasoningDetail string `json:"reasoning_detail"` | |
} `json:"metadata"` | |
} | |
var sseDataPool = sync.Pool{ | |
New: func() interface{} { | |
return &SSEData{} | |
}, | |
} | |
// processMonicaSSE 处理Monica的SSE数据 | |
type processMonicaSSE struct { | |
reader *bufio.Reader | |
model string | |
buf []byte | |
} | |
// handleSSEData 处理单条SSE数据 | |
type handleSSEData func(*SSEData) error | |
// processSSEStream 处理SSE流 | |
func (p *processMonicaSSE) processSSEStream(handler handleSSEData) error { | |
if p.buf == nil { | |
p.buf = make([]byte, 4096) | |
} | |
var line []byte | |
var err error | |
for { | |
line, err = p.reader.ReadBytes('\n') | |
if err != nil { | |
if err == io.EOF { | |
return nil | |
} | |
return fmt.Errorf("read error: %w", err) | |
} | |
// Monica SSE 的行前缀一般是 "data: " | |
if len(line) < dataPrefixLen || !bytes.HasPrefix(line, []byte(dataPrefix)) { | |
continue | |
} | |
jsonStr := line[dataPrefixLen : len(line)-1] // 去掉\n | |
if len(jsonStr) == 0 { | |
continue | |
} | |
// 如果是 [DONE] 则结束 | |
if bytes.Equal(jsonStr, []byte(sseFinish)) { | |
return nil | |
} | |
// 从对象池获取一个对象 | |
sseData := sseDataPool.Get().(*SSEData) | |
// 解析 JSON | |
if err := sonic.Unmarshal(jsonStr, sseData); err != nil { | |
sseData = &SSEData{} | |
sseDataPool.Put(sseData) | |
return fmt.Errorf("unmarshal error: %w", err) | |
} | |
// 调用处理函数 | |
if err := handler(sseData); err != nil { | |
sseData = &SSEData{} | |
sseDataPool.Put(sseData) | |
return err | |
} | |
// 使用完后清理并放回对象池 | |
sseData = &SSEData{} | |
sseDataPool.Put(sseData) | |
} | |
} | |
// CollectMonicaSSEToCompletion 将 Monica SSE 转换为完整的 ChatCompletion 响应 | |
func CollectMonicaSSEToCompletion(model string, r io.Reader) (*openai.ChatCompletionResponse, error) { | |
var fullContent strings.Builder | |
processor := &processMonicaSSE{ | |
reader: bufio.NewReaderSize(r, bufferSize), | |
model: model, | |
} | |
// 处理SSE数据 | |
err := processor.processSSEStream(func(sseData *SSEData) error { | |
// 如果是 agent_status,跳过 | |
if sseData.AgentStatus.Type != "" { | |
return nil | |
} | |
// 累积内容 | |
fullContent.WriteString(sseData.Text) | |
return nil | |
}) | |
if err != nil { | |
return nil, err | |
} | |
// 构造完整的响应 | |
response := &openai.ChatCompletionResponse{ | |
ID: fmt.Sprintf("chatcmpl-%s", utils.RandStringUsingMathRand(29)), | |
Object: "chat.completion", | |
Created: time.Now().Unix(), | |
Model: model, | |
Choices: []openai.ChatCompletionChoice{ | |
{ | |
Index: 0, | |
Message: openai.ChatCompletionMessage{ | |
Role: "assistant", | |
Content: fullContent.String(), | |
}, | |
FinishReason: "stop", | |
}, | |
}, | |
Usage: openai.Usage{ | |
// Monica API 不提供 token 使用信息,这里暂时填 0 | |
PromptTokens: 0, | |
CompletionTokens: 0, | |
TotalTokens: 0, | |
}, | |
} | |
return response, nil | |
} | |
// StreamMonicaSSEToClient 将 Monica SSE 转成前端可用的流 | |
func StreamMonicaSSEToClient(model string, w io.Writer, r io.Reader) error { | |
writer := bufio.NewWriterSize(w, bufferSize) | |
defer writer.Flush() | |
chatId := utils.RandStringUsingMathRand(29) | |
now := time.Now().Unix() | |
fingerprint := utils.RandStringUsingMathRand(10) | |
// 创建一个定时刷新的 ticker | |
ticker := time.NewTicker(flushInterval) | |
defer ticker.Stop() | |
// 创建一个 done channel 用于清理 | |
done := make(chan struct{}) | |
defer close(done) | |
// 启动一个 goroutine 定期刷新缓冲区 | |
go func() { | |
for { | |
select { | |
case <-ticker.C: | |
if f, ok := w.(http.Flusher); ok { | |
writer.Flush() | |
f.Flush() | |
} | |
case <-done: | |
return | |
} | |
} | |
}() | |
processor := &processMonicaSSE{ | |
reader: bufio.NewReaderSize(r, bufferSize), | |
model: model, | |
} | |
var thinkFlag bool | |
return processor.processSSEStream(func(sseData *SSEData) error { | |
var sseMsg types.ChatCompletionStreamResponse | |
switch { | |
case sseData.Finished: | |
sseMsg = types.ChatCompletionStreamResponse{ | |
ID: "chatcmpl-" + chatId, | |
Object: sseObject, | |
Created: now, | |
Model: model, | |
Choices: []types.ChatCompletionStreamChoice{ | |
{ | |
Index: 0, | |
Delta: openai.ChatCompletionStreamChoiceDelta{ | |
Role: openai.ChatMessageRoleAssistant, | |
}, | |
FinishReason: openai.FinishReasonStop, | |
}, | |
}, | |
} | |
case sseData.AgentStatus.Type == "thinking": | |
thinkFlag = true | |
sseMsg = types.ChatCompletionStreamResponse{ | |
ID: "chatcmpl-" + chatId, | |
Object: sseObject, | |
SystemFingerprint: fingerprint, | |
Created: now, | |
Model: model, | |
Choices: []types.ChatCompletionStreamChoice{ | |
{ | |
Index: 0, | |
Delta: openai.ChatCompletionStreamChoiceDelta{ | |
Role: openai.ChatMessageRoleAssistant, | |
Content: `<think>`, | |
}, | |
FinishReason: openai.FinishReasonNull, | |
}, | |
}, | |
} | |
case sseData.AgentStatus.Type == "thinking_detail_stream": | |
sseMsg = types.ChatCompletionStreamResponse{ | |
ID: "chatcmpl-" + chatId, | |
Object: sseObject, | |
SystemFingerprint: fingerprint, | |
Created: now, | |
Model: model, | |
Choices: []types.ChatCompletionStreamChoice{ | |
{ | |
Index: 0, | |
Delta: openai.ChatCompletionStreamChoiceDelta{ | |
Role: openai.ChatMessageRoleAssistant, | |
Content: sseData.AgentStatus.Metadata.ReasoningDetail, | |
}, | |
FinishReason: openai.FinishReasonNull, | |
}, | |
}, | |
} | |
default: | |
if thinkFlag { | |
sseData.Text = "</think>" + sseData.Text | |
thinkFlag = false | |
} | |
sseMsg = types.ChatCompletionStreamResponse{ | |
ID: "chatcmpl-" + chatId, | |
Object: sseObject, | |
SystemFingerprint: fingerprint, | |
Created: now, | |
Model: model, | |
Choices: []types.ChatCompletionStreamChoice{ | |
{ | |
Index: 0, | |
Delta: openai.ChatCompletionStreamChoiceDelta{ | |
Role: openai.ChatMessageRoleAssistant, | |
Content: sseData.Text, | |
}, | |
FinishReason: openai.FinishReasonNull, | |
}, | |
}, | |
} | |
} | |
var sb strings.Builder | |
sb.WriteString("data: ") | |
sendLine, _ := sonic.MarshalString(sseMsg) | |
sb.WriteString(sendLine) | |
sb.WriteString("\n\n") | |
// 写入缓冲区 | |
if _, err := writer.WriteString(sb.String()); err != nil { | |
return fmt.Errorf("write error: %w", err) | |
} | |
// 如果发现 finished=true,就可以结束 | |
if sseData.Finished { | |
writer.WriteString(dataPrefix) | |
writer.WriteString(sseFinish) | |
writer.WriteString(lineEnd) | |
writer.Flush() | |
if f, ok := w.(http.Flusher); ok { | |
f.Flush() | |
} | |
return nil | |
} | |
sseData.AgentStatus.Type = "" | |
sseData.Finished = false | |
return nil | |
}) | |
} | |