eta_llm_client.go 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253
  1. package eta_llm
  2. import (
  3. "bufio"
  4. "bytes"
  5. "encoding/json"
  6. "errors"
  7. "eta/eta_api/models"
  8. "eta/eta_api/utils"
  9. "eta/eta_api/utils/llm"
  10. "eta/eta_api/utils/llm/eta_llm/eta_llm_http"
  11. "fmt"
  12. "io"
  13. "net/http"
  14. "strings"
  15. "sync"
  16. )
var (
	// dsOnce guards the one-time construction of etaLlmClient in GetInstance.
	dsOnce sync.Once
	// etaLlmClient is the package-level client handed out by GetInstance. It
	// stays nil when GetInstance finds an empty configuration string.
	etaLlmClient *ETALLMClient
)
const (
	// KNOWLEDEG_CHAT_MODE is the Mode value sent by KnowledgeBaseChat.
	// NOTE(review): "KNOWLEDEG" looks like a typo of "KNOWLEDGE"; the name is
	// exported, so check external callers before renaming.
	KNOWLEDEG_CHAT_MODE = "local_kb"
	// DEFALUT_PROMPT_NAME is the PromptName sent by KnowledgeBaseChat.
	// NOTE(review): "DEFALUT" looks like a typo of "DEFAULT"; the name is
	// exported, so check external callers before renaming.
	DEFALUT_PROMPT_NAME = "default"
	// CONTENT_TYPE_JSON is the Content-Type used by DoPost and DoStreamPost.
	CONTENT_TYPE_JSON = "application/json"
	// KNOWLEDGE_BASE_CHAT_API is the path (appended to BaseURL) used by KnowledgeBaseChat.
	KNOWLEDGE_BASE_CHAT_API = "/chat/kb_chat"
	// DOCUMENT_CHAT_API is the path (appended to BaseURL) used by DocumentChat.
	DOCUMENT_CHAT_API = "/chat/file_chat"
	// KNOWLEDGE_BASE_SEARCH_DOCS_API is the path (appended to BaseURL) used by SearchKbDocs.
	KNOWLEDGE_BASE_SEARCH_DOCS_API = "/knowledge_base/search_docs"
)
// ETALLMClient is the client for the ETA LLM server. It embeds *llm.LLMClient,
// whose HttpClient and BaseURL are used by DoPost and DoStreamPost, and adds
// the model name that the chat methods put into their requests.
type ETALLMClient struct {
	*llm.LLMClient
	// LlmModel is the model name sent in DocumentChat and KnowledgeBaseChat requests.
	LlmModel string
}
// LLMConfig is the JSON shape of the configuration string that GetInstance
// decodes before building the client.
type LLMConfig struct {
	// LlmAddress is the server address passed to llm.NewLLMClient.
	LlmAddress string `json:"llm_server"`
	// LlmModel is the model name copied into ETALLMClient.LlmModel.
	LlmModel string `json:"llm_model"`
}
  37. func GetInstance() llm.LLMService {
  38. dsOnce.Do(func() {
  39. confStr := models.BusinessConfMap[models.LLMInitConfig]
  40. if confStr == "" {
  41. utils.FileLog.Error("LLM配置为空")
  42. return
  43. }
  44. var config LLMConfig
  45. err := json.Unmarshal([]byte(confStr), &config)
  46. if err != nil {
  47. utils.FileLog.Error("LLM配置错误")
  48. }
  49. if etaLlmClient == nil {
  50. etaLlmClient = &ETALLMClient{
  51. LLMClient: llm.NewLLMClient(config.LlmAddress, 120),
  52. LlmModel: config.LlmModel,
  53. }
  54. }
  55. })
  56. return etaLlmClient
  57. }
  58. func (ds *ETALLMClient) DocumentChat(query string, KnowledgeId string, history []json.RawMessage, stream bool) (llmRes *http.Response, err error) {
  59. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  60. for _, historyItemStr := range history {
  61. var historyItem eta_llm_http.HistoryContent
  62. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  63. if parseErr != nil {
  64. continue
  65. }
  66. //str := strings.Split(historyItemStr, "-")
  67. //historyItem := eta_llm_http.HistoryContent{
  68. // Role: str[0],
  69. // Content: str[1],
  70. //}
  71. ChatHistory = append(ChatHistory, historyItem)
  72. }
  73. kbReq := eta_llm_http.DocumentChatRequest{
  74. Query: query,
  75. KnowledgeId: KnowledgeId,
  76. History: ChatHistory,
  77. TopK: 3,
  78. //ScoreThreshold: 0.5,
  79. ScoreThreshold: 2,
  80. Stream: stream,
  81. ModelName: ds.LlmModel,
  82. //Temperature: 0.7,
  83. Temperature: 0.01,
  84. MaxTokens: 0,
  85. //PromptName: DEFALUT_PROMPT_NAME,
  86. }
  87. //fmt.Printf("%v", kbReq.History)
  88. body, err := json.Marshal(kbReq)
  89. fmt.Println(string(body))
  90. if err != nil {
  91. return
  92. }
  93. return ds.DoStreamPost(DOCUMENT_CHAT_API, body)
  94. }
  95. func (ds *ETALLMClient) KnowledgeBaseChat(query string, KnowledgeBaseName string, history []json.RawMessage) (llmRes *http.Response, err error) {
  96. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  97. for _, historyItemStr := range history {
  98. //str := strings.Split(historyItemStr, "-")
  99. //historyItem := eta_llm_http.HistoryContent{
  100. // Role: str[0],
  101. // Content: str[1],
  102. //}
  103. var historyItem eta_llm_http.HistoryContent
  104. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  105. if parseErr != nil {
  106. continue
  107. }
  108. ChatHistory = append(ChatHistory, historyItem)
  109. }
  110. kbReq := eta_llm_http.KbChatRequest{
  111. Query: query,
  112. Mode: KNOWLEDEG_CHAT_MODE,
  113. KbName: KnowledgeBaseName,
  114. History: ChatHistory,
  115. TopK: 3,
  116. ScoreThreshold: 0.5,
  117. Stream: true,
  118. Model: ds.LlmModel,
  119. Temperature: 0.7,
  120. MaxTokens: 0,
  121. PromptName: DEFALUT_PROMPT_NAME,
  122. ReturnDirect: false,
  123. }
  124. fmt.Printf("%v", kbReq.History)
  125. body, err := json.Marshal(kbReq)
  126. if err != nil {
  127. return
  128. }
  129. return ds.DoStreamPost(KNOWLEDGE_BASE_CHAT_API, body)
  130. }
  131. func (ds *ETALLMClient) SearchKbDocs(query string, KnowledgeBaseName string) (content interface{}, err error) {
  132. kbReq := eta_llm_http.KbSearchDocsRequest{
  133. Query: query,
  134. KnowledgeBaseName: KnowledgeBaseName,
  135. TopK: 10,
  136. ScoreThreshold: 0.5,
  137. Metadata: struct{}{},
  138. }
  139. body, err := json.Marshal(kbReq)
  140. if err != nil {
  141. return
  142. }
  143. resp, err := ds.DoPost(KNOWLEDGE_BASE_SEARCH_DOCS_API, body)
  144. if !resp.Success {
  145. err = errors.New(resp.Msg)
  146. return
  147. }
  148. if resp.Data != nil {
  149. var kbSearchRes []eta_llm_http.SearchDocsResponse
  150. err = json.Unmarshal(resp.Data, &kbSearchRes)
  151. if err != nil {
  152. err = errors.New("搜索知识库失败")
  153. return
  154. }
  155. content = kbSearchRes
  156. return
  157. }
  158. err = errors.New("搜索知识库失败")
  159. return
  160. }
  161. func init() {
  162. err := llm.Register(llm.ETA_LLM_CLIENT, GetInstance())
  163. if err != nil {
  164. utils.FileLog.Error("注册eta_llm_server服务失败:", err)
  165. }
  166. }
  167. func (ds *ETALLMClient) DoPost(apiUrl string, body []byte) (baseResp eta_llm_http.BaseResponse, err error) {
  168. requestReader := bytes.NewReader(body)
  169. response, err := ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  170. if err != nil {
  171. return
  172. }
  173. return parseResponse(response)
  174. }
  175. func (ds *ETALLMClient) DoStreamPost(apiUrl string, body []byte) (baseResp *http.Response, err error) {
  176. requestReader := bytes.NewReader(body)
  177. return ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  178. }
  179. func parseResponse(response *http.Response) (baseResp eta_llm_http.BaseResponse, err error) {
  180. defer func() {
  181. _ = response.Body.Close()
  182. }()
  183. baseResp.Ret = response.StatusCode
  184. if response.StatusCode != http.StatusOK {
  185. baseResp.Msg = fmt.Sprintf("请求失败,状态码:%d, 状态信息:%s", response.StatusCode, http.StatusText(response.StatusCode))
  186. return
  187. }
  188. bodyBytes, err := io.ReadAll(response.Body)
  189. if err != nil {
  190. err = fmt.Errorf("读取响应体失败: %w", err)
  191. return
  192. }
  193. baseResp.Success = true
  194. baseResp.Data = bodyBytes
  195. return
  196. }
  197. func ParseStreamResponse(response *http.Response) (contentChan chan string, errChan chan error, closeChan chan struct{}) {
  198. contentChan = make(chan string, 10)
  199. errChan = make(chan error, 10)
  200. closeChan = make(chan struct{})
  201. go func() {
  202. defer close(contentChan)
  203. defer close(errChan)
  204. defer close(closeChan)
  205. scanner := bufio.NewScanner(response.Body)
  206. scanner.Split(bufio.ScanLines)
  207. for scanner.Scan() {
  208. line := scanner.Text()
  209. if line == "" {
  210. continue
  211. }
  212. // 忽略 "ping" 行
  213. if strings.HasPrefix(line, ": ping") {
  214. continue
  215. }
  216. // 去除 "data: " 前缀
  217. if strings.HasPrefix(line, "data: ") {
  218. line = strings.TrimPrefix(line, "data: ")
  219. }
  220. var chunk eta_llm_http.ChunkResponse
  221. if err := json.Unmarshal([]byte(line), &chunk); err != nil {
  222. fmt.Println("解析错误的line:" + line)
  223. errChan <- fmt.Errorf("解析 JSON 块失败: %w", err)
  224. return
  225. }
  226. // 处理每个 chunk
  227. if chunk.Choices != nil && len(chunk.Choices) > 0 {
  228. for _, choice := range chunk.Choices {
  229. if choice.Delta.Content != "" {
  230. contentChan <- choice.Delta.Content
  231. }
  232. }
  233. }
  234. }
  235. if err := scanner.Err(); err != nil {
  236. errChan <- fmt.Errorf("读取响应体失败: %w", err)
  237. return
  238. }
  239. }()
  240. return
  241. }