117 lines
2.7 KiB
Go
117 lines
2.7 KiB
Go
|
|
package eino
|
|||
|
|
|
|||
|
|
import (
|
|||
|
|
"bytes"
|
|||
|
|
"context"
|
|||
|
|
"encoding/json"
|
|||
|
|
"fmt"
|
|||
|
|
"io"
|
|||
|
|
"net/http"
|
|||
|
|
"time"
|
|||
|
|
|
|||
|
|
"github.com/cloudwego/eino/schema"
|
|||
|
|
"github.com/gogf/gf/v2/frame/g"
|
|||
|
|
)
|
|||
|
|
|
|||
|
|
// DashScopeReranker 通义百炼 Rerank 精排(Cross-Encoder)
|
|||
|
|
type DashScopeReranker struct {
|
|||
|
|
httpClient *http.Client
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
func NewDashScopeReranker() *DashScopeReranker {
|
|||
|
|
return &DashScopeReranker{
|
|||
|
|
httpClient: &http.Client{
|
|||
|
|
Timeout: 10 * time.Second,
|
|||
|
|
},
|
|||
|
|
}
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// Rerank 对文档进行精排(Cross-Encoder 核心)
|
|||
|
|
func (d *DashScopeReranker) Rerank(ctx context.Context, query string, docs []*schema.Document) ([]*schema.Document, error) {
|
|||
|
|
if len(docs) == 0 {
|
|||
|
|
return docs, nil
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// 官方必过 URL
|
|||
|
|
url := "https://dashscope.aliyuncs.com/api/v1/services/rerank/text-rerank/text-rerank"
|
|||
|
|
apiKey := g.Cfg().MustGet(ctx, "eino.rerank.apiKey").String()
|
|||
|
|
model := g.Cfg().MustGet(ctx, "eino.rerank.model").String()
|
|||
|
|
|
|||
|
|
documents := make([]string, len(docs))
|
|||
|
|
for i, doc := range docs {
|
|||
|
|
documents[i] = doc.Content
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
reqBody := map[string]any{
|
|||
|
|
"model": model,
|
|||
|
|
"input": map[string]any{
|
|||
|
|
"query": query,
|
|||
|
|
"documents": documents,
|
|||
|
|
},
|
|||
|
|
"parameters": map[string]any{
|
|||
|
|
"top_n": len(docs),
|
|||
|
|
},
|
|||
|
|
}
|
|||
|
|
bs, _ := json.Marshal(reqBody)
|
|||
|
|
|
|||
|
|
req, _ := http.NewRequestWithContext(ctx, "POST", url, bytes.NewBuffer(bs))
|
|||
|
|
req.Header.Set("Authorization", "Bearer "+apiKey)
|
|||
|
|
req.Header.Set("Content-Type", "application/json")
|
|||
|
|
|
|||
|
|
resp, err := d.httpClient.Do(req)
|
|||
|
|
if err != nil {
|
|||
|
|
return nil, err
|
|||
|
|
}
|
|||
|
|
defer resp.Body.Close()
|
|||
|
|
|
|||
|
|
if resp.StatusCode < 200 || resp.StatusCode >= 300 {
|
|||
|
|
body, _ := io.ReadAll(resp.Body)
|
|||
|
|
return nil, fmt.Errorf("rerank api error: status=%d, body=%s", resp.StatusCode, string(body))
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// 解析结果
|
|||
|
|
var result struct {
|
|||
|
|
Output struct {
|
|||
|
|
Results []struct {
|
|||
|
|
Index int `json:"index"`
|
|||
|
|
RelevanceScore float64 `json:"relevance_score"`
|
|||
|
|
} `json:"results"`
|
|||
|
|
} `json:"output"`
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
if err := json.NewDecoder(resp.Body).Decode(&result); err != nil {
|
|||
|
|
return nil, err
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// 按分数排序
|
|||
|
|
type scoredDoc struct {
|
|||
|
|
doc *schema.Document
|
|||
|
|
score float64
|
|||
|
|
}
|
|||
|
|
scored := make([]scoredDoc, len(docs))
|
|||
|
|
for i, doc := range docs {
|
|||
|
|
scored[i] = scoredDoc{doc: doc, score: 0}
|
|||
|
|
}
|
|||
|
|
for _, res := range result.Output.Results {
|
|||
|
|
scored[res.Index].score = res.RelevanceScore
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// 分数从高到低排序
|
|||
|
|
for i := 0; i < len(scored); i++ {
|
|||
|
|
for j := i + 1; j < len(scored); j++ {
|
|||
|
|
if scored[j].score > scored[i].score {
|
|||
|
|
scored[i], scored[j] = scored[j], scored[i]
|
|||
|
|
}
|
|||
|
|
}
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
// 输出最终排好的文档
|
|||
|
|
ranked := make([]*schema.Document, 0, len(scored))
|
|||
|
|
for _, s := range scored {
|
|||
|
|
s.doc.MetaData["rerank_score"] = s.score
|
|||
|
|
ranked = append(ranked, s.doc)
|
|||
|
|
}
|
|||
|
|
|
|||
|
|
return ranked, nil
|
|||
|
|
}
|