eta_llm_client.go 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209
  1. package eta_llm
  2. import (
  3. "bufio"
  4. "bytes"
  5. "encoding/json"
  6. "errors"
  7. "eta/eta_api/models"
  8. "eta/eta_api/utils"
  9. "eta/eta_api/utils/llm"
  10. "eta/eta_api/utils/llm/eta_llm/eta_llm_http"
  11. "fmt"
  12. "io"
  13. "net/http"
  14. "strings"
  15. "sync"
  16. )
  // Package-level singleton state used by GetInstance.
  var (
  	// dsOnce guards the one-time construction of etaLlmClient.
  	dsOnce sync.Once
  	// etaLlmClient is the shared client instance. It stays nil when
  	// GetInstance finds an empty configuration string.
  	etaLlmClient *ETALLMClient
  )
  // Fixed request values and endpoint paths used by the methods in this file.
  //
  // NOTE(review): "KNOWLEDEG" and "DEFALUT" look like misspellings of
  // "KNOWLEDGE" and "DEFAULT"; confirm no other file references these names
  // before renaming them.
  const (
  	// KNOWLEDEG_CHAT_MODE is sent as KbChatRequest.Mode by KnowledgeBaseChat.
  	KNOWLEDEG_CHAT_MODE = "local_kb"
  	// DEFALUT_PROMPT_NAME is sent as KbChatRequest.PromptName by KnowledgeBaseChat.
  	DEFALUT_PROMPT_NAME = "default"
  	// CONTENT_TYPE_JSON is the Content-Type passed to every POST issued here.
  	CONTENT_TYPE_JSON = "application/json"
  	// KNOWLEDGE_BASE_CHAT_API is appended to the client's BaseURL by KnowledgeBaseChat.
  	KNOWLEDGE_BASE_CHAT_API = "/chat/kb_chat"
  	// KNOWLEDGE_BASE_SEARCH_DOCS_API is appended to the client's BaseURL by SearchKbDocs.
  	KNOWLEDGE_BASE_SEARCH_DOCS_API = "/knowledge_base/search_docs"
  )
  // ETALLMClient is the client for the ETA LLM server. It embeds
  // *llm.LLMClient, whose HttpClient and BaseURL fields are used by DoPost and
  // DoStreamPost.
  type ETALLMClient struct {
  	*llm.LLMClient
  	// LlmModel is sent as the Model field of knowledge-base chat requests.
  	LlmModel string
  }
  // LLMConfig is the JSON shape GetInstance decodes from the
  // models.LLMInitConfig entry of models.BusinessConfMap.
  type LLMConfig struct {
  	// LlmAddress is passed to llm.NewLLMClient as its first argument
  	// (presumably the server base URL; confirm against llm.NewLLMClient).
  	LlmAddress string `json:"llm_server"`
  	// LlmModel is copied into ETALLMClient.LlmModel.
  	LlmModel string `json:"llm_model"`
  }
  36. func GetInstance() llm.LLMService {
  37. dsOnce.Do(func() {
  38. confStr := models.BusinessConfMap[models.LLMInitConfig]
  39. if confStr == "" {
  40. utils.FileLog.Error("LLM配置为空")
  41. return
  42. }
  43. var config LLMConfig
  44. err := json.Unmarshal([]byte(confStr), &config)
  45. if err != nil {
  46. utils.FileLog.Error("LLM配置错误")
  47. }
  48. if etaLlmClient == nil {
  49. etaLlmClient = &ETALLMClient{
  50. LLMClient: llm.NewLLMClient(config.LlmAddress, 120),
  51. LlmModel: config.LlmModel,
  52. }
  53. }
  54. })
  55. return etaLlmClient
  56. }
  57. func (ds *ETALLMClient) KnowledgeBaseChat(query string, KnowledgeBaseName string, history []string) (llmRes *http.Response, err error) {
  58. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  59. for _, historyItemStr := range history {
  60. str := strings.Split(historyItemStr, "-")
  61. historyItem := eta_llm_http.HistoryContent{
  62. Role: str[0],
  63. Content: str[1],
  64. }
  65. ChatHistory = append(ChatHistory, historyItem)
  66. }
  67. kbReq := eta_llm_http.KbChatRequest{
  68. Query: query,
  69. Mode: KNOWLEDEG_CHAT_MODE,
  70. KbName: KnowledgeBaseName,
  71. History: ChatHistory,
  72. TopK: 3,
  73. ScoreThreshold: 0.5,
  74. Stream: true,
  75. Model: ds.LlmModel,
  76. Temperature: 0.7,
  77. MaxTokens: 0,
  78. PromptName: DEFALUT_PROMPT_NAME,
  79. ReturnDirect: false,
  80. }
  81. fmt.Printf("%v", kbReq.History)
  82. body, err := json.Marshal(kbReq)
  83. if err != nil {
  84. return
  85. }
  86. return ds.DoStreamPost(KNOWLEDGE_BASE_CHAT_API, body)
  87. }
  88. func (ds *ETALLMClient) SearchKbDocs(query string, KnowledgeBaseName string) (content interface{}, err error) {
  89. kbReq := eta_llm_http.KbSearchDocsRequest{
  90. Query: query,
  91. KnowledgeBaseName: KnowledgeBaseName,
  92. TopK: 10,
  93. ScoreThreshold: 0.5,
  94. Metadata: struct{}{},
  95. }
  96. body, err := json.Marshal(kbReq)
  97. if err != nil {
  98. return
  99. }
  100. resp, err := ds.DoPost(KNOWLEDGE_BASE_SEARCH_DOCS_API, body)
  101. if !resp.Success {
  102. err = errors.New(resp.Msg)
  103. return
  104. }
  105. if resp.Data != nil {
  106. var kbSearchRes []eta_llm_http.SearchDocsResponse
  107. err = json.Unmarshal(resp.Data, &kbSearchRes)
  108. if err != nil {
  109. err = errors.New("搜索知识库失败")
  110. return
  111. }
  112. content = kbSearchRes
  113. return
  114. }
  115. err = errors.New("搜索知识库失败")
  116. return
  117. }
  118. func init() {
  119. err := llm.Register(llm.ETA_LLM_CLIENT, GetInstance())
  120. if err != nil {
  121. utils.FileLog.Error("注册eta_llm_server服务失败:", err)
  122. }
  123. }
  124. func (ds *ETALLMClient) DoPost(apiUrl string, body []byte) (baseResp eta_llm_http.BaseResponse, err error) {
  125. requestReader := bytes.NewReader(body)
  126. response, err := ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  127. if err != nil {
  128. return
  129. }
  130. return parseResponse(response)
  131. }
  132. func (ds *ETALLMClient) DoStreamPost(apiUrl string, body []byte) (baseResp *http.Response, err error) {
  133. requestReader := bytes.NewReader(body)
  134. return ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  135. }
  136. func parseResponse(response *http.Response) (baseResp eta_llm_http.BaseResponse, err error) {
  137. defer func() {
  138. _ = response.Body.Close()
  139. }()
  140. baseResp.Ret = response.StatusCode
  141. if response.StatusCode != http.StatusOK {
  142. baseResp.Msg = fmt.Sprintf("请求失败,状态码:%d, 状态信息:%s", response.StatusCode, http.StatusText(response.StatusCode))
  143. return
  144. }
  145. bodyBytes, err := io.ReadAll(response.Body)
  146. if err != nil {
  147. err = fmt.Errorf("读取响应体失败: %w", err)
  148. return
  149. }
  150. baseResp.Success = true
  151. baseResp.Data = bodyBytes
  152. return
  153. }
  154. func ParseStreamResponse(response *http.Response) (contentChan chan string, errChan chan error, closeChan chan struct{}) {
  155. contentChan = make(chan string, 10)
  156. errChan = make(chan error, 10)
  157. closeChan = make(chan struct{})
  158. go func() {
  159. defer close(contentChan)
  160. defer close(errChan)
  161. defer close(closeChan)
  162. scanner := bufio.NewScanner(response.Body)
  163. scanner.Split(bufio.ScanLines)
  164. for scanner.Scan() {
  165. line := scanner.Text()
  166. if line == "" {
  167. continue
  168. }
  169. // 忽略 "ping" 行
  170. if strings.HasPrefix(line, ": ping") {
  171. continue
  172. }
  173. // 去除 "data: " 前缀
  174. if strings.HasPrefix(line, "data: ") {
  175. line = strings.TrimPrefix(line, "data: ")
  176. }
  177. var chunk eta_llm_http.ChunkResponse
  178. if err := json.Unmarshal([]byte(line), &chunk); err != nil {
  179. fmt.Println("解析错误的line:" + line)
  180. errChan <- fmt.Errorf("解析 JSON 块失败: %w", err)
  181. return
  182. }
  183. // 处理每个 chunk
  184. if chunk.Choices != nil && len(chunk.Choices) > 0 {
  185. for _, choice := range chunk.Choices {
  186. if choice.Delta.Content != "" {
  187. contentChan <- choice.Delta.Content
  188. }
  189. }
  190. }
  191. }
  192. if err := scanner.Err(); err != nil {
  193. errChan <- fmt.Errorf("读取响应体失败: %w", err)
  194. return
  195. }
  196. }()
  197. return
  198. }