eta_llm_client.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438
  1. package eta_llm
  2. import (
  3. "bufio"
  4. "bytes"
  5. "encoding/json"
  6. "errors"
  7. "eta/eta_api/models"
  8. "eta/eta_api/utils"
  9. "eta/eta_api/utils/llm"
  10. "eta/eta_api/utils/llm/eta_llm/eta_llm_http"
  11. "fmt"
  12. "io"
  13. "mime/multipart"
  14. "net/http"
  15. "os"
  16. "strings"
  17. "sync"
  18. )
  19. var (
  20. dsOnce sync.Once
  21. etaLlmClient *ETALLMClient
  22. modelRouter = map[string]string{
  23. "deepseek-r1:32b": "/dsr1",
  24. "qwq:32b": "/qwq",
  25. }
  26. )
  // Request defaults sent to the LLM server. The misspelled identifiers
  // (KNOWLEDEG, DEFALUT) are exported and therefore kept as they are.
  const (
  	KNOWLEDEG_CHAT_MODE = "local_kb"
  	DEFALUT_PROMPT_NAME = "default"
  )

  // CONTENT_TYPE_JSON is the Content-Type header value used for JSON POST requests.
  const CONTENT_TYPE_JSON = "application/json"

  // API paths, appended to the client's base URL (and, for some calls, to a
  // model-specific prefix taken from modelRouter).
  const (
  	KNOWLEDGE_BASE_CHAT_API        = "/chat/kb_chat"
  	COMPLETION_CHAT_API            = "/chat/chat/completions"
  	DOCUMENT_CHAT_API              = "/chat/file_chat"
  	KNOWLEDGE_BASE_SEARCH_DOCS_API = "/knowledge_base/search_docs"
  	UPLOAD_TEMP_DOCS_API           = "/knowledge_base/upload_temp_docs"
  )
  37. type ETALLMClient struct {
  38. *llm.LLMClient
  39. LlmModel string
  40. }
  // LLMConfig is the JSON document GetInstance reads from the business
  // configuration.
  type LLMConfig struct {
  	// LlmAddress is decoded from "llm_server" and passed to llm.NewLLMClient.
  	LlmAddress string `json:"llm_server"`
  	// LlmModel is decoded from "llm_model" and becomes the client's default model.
  	LlmModel string `json:"llm_model"`
  }
  45. func GetInstance() llm.LLMService {
  46. dsOnce.Do(func() {
  47. confStr := models.BusinessConfMap[models.LLMInitConfig]
  48. if confStr == "" {
  49. utils.FileLog.Error("LLM配置为空")
  50. return
  51. }
  52. var config LLMConfig
  53. err := json.Unmarshal([]byte(confStr), &config)
  54. if err != nil {
  55. utils.FileLog.Error("LLM配置错误")
  56. }
  57. if etaLlmClient == nil {
  58. etaLlmClient = &ETALLMClient{
  59. LLMClient: llm.NewLLMClient(config.LlmAddress, 300),
  60. LlmModel: config.LlmModel,
  61. }
  62. }
  63. })
  64. return etaLlmClient
  65. }
  66. func (ds *ETALLMClient) DocumentChat(query string, KnowledgeId string, history []json.RawMessage, stream bool) (llmRes *http.Response, err error) {
  67. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  68. for _, historyItemStr := range history {
  69. var historyItem eta_llm_http.HistoryContent
  70. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  71. if parseErr != nil {
  72. continue
  73. }
  74. //str := strings.Split(historyItemStr, "-")
  75. //historyItem := eta_llm_http.HistoryContent{
  76. // Role: str[0],
  77. // Content: str[1],
  78. //}
  79. ChatHistory = append(ChatHistory, historyItem)
  80. }
  81. kbReq := eta_llm_http.DocumentChatRequest{
  82. Query: query,
  83. KnowledgeId: KnowledgeId,
  84. History: ChatHistory,
  85. TopK: 3,
  86. //ScoreThreshold: 0.5,
  87. ScoreThreshold: 2,
  88. Stream: stream,
  89. ModelName: ds.LlmModel,
  90. //Temperature: 0.7,
  91. Temperature: 0.01,
  92. MaxTokens: 0,
  93. //PromptName: DEFALUT_PROMPT_NAME,
  94. }
  95. //fmt.Printf("%v", kbReq.History)
  96. body, err := json.Marshal(kbReq)
  97. fmt.Println(string(body))
  98. if err != nil {
  99. return
  100. }
  101. return ds.DoStreamPost(DOCUMENT_CHAT_API, body)
  102. }
  103. func (ds *ETALLMClient) CompletionChat(query string, messages []json.RawMessage) (llmRes *http.Response, err error) {
  104. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  105. for _, historyItemStr := range messages {
  106. var historyItem eta_llm_http.HistoryContentWeb
  107. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  108. if parseErr != nil {
  109. continue
  110. }
  111. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  112. Content: historyItem.Content,
  113. Role: historyItem.Role,
  114. })
  115. }
  116. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  117. Content: query,
  118. Role: "user",
  119. })
  120. kbReq := eta_llm_http.CompletionChatRequest{
  121. Mode: KNOWLEDEG_CHAT_MODE,
  122. Messages: ChatHistory,
  123. TopK: 3,
  124. ScoreThreshold: 0.5,
  125. Stream: true,
  126. Model: "qwq:32b",
  127. Temperature: 0.7,
  128. MaxTokens: 0,
  129. PromptName: DEFALUT_PROMPT_NAME,
  130. ReturnDirect: false,
  131. }
  132. fmt.Printf("%v", kbReq.Messages)
  133. utils.FileLog.Info("kbReq.Messages: %v", kbReq.Messages)
  134. body, err := json.Marshal(kbReq)
  135. if err != nil {
  136. return
  137. }
  138. return ds.DoStreamPost(COMPLETION_CHAT_API, body)
  139. }
  140. func (ds *ETALLMClient) KnowledgeBaseChat(query string, KnowledgeBaseName string, history []json.RawMessage) (llmRes *http.Response, err error) {
  141. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  142. for _, historyItemStr := range history {
  143. var historyItem eta_llm_http.HistoryContentWeb
  144. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  145. if parseErr != nil {
  146. continue
  147. }
  148. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  149. Content: historyItem.Content,
  150. Role: historyItem.Role,
  151. })
  152. }
  153. kbReq := eta_llm_http.KbChatRequest{
  154. Query: query,
  155. Mode: KNOWLEDEG_CHAT_MODE,
  156. KbName: KnowledgeBaseName,
  157. History: ChatHistory,
  158. TopK: 3,
  159. ScoreThreshold: 0.5,
  160. Stream: true,
  161. Model: ds.LlmModel,
  162. Temperature: 0.7,
  163. MaxTokens: 0,
  164. PromptName: DEFALUT_PROMPT_NAME,
  165. ReturnDirect: false,
  166. }
  167. fmt.Printf("%v", kbReq.History)
  168. body, err := json.Marshal(kbReq)
  169. if err != nil {
  170. return
  171. }
  172. return ds.DoStreamPost(KNOWLEDGE_BASE_CHAT_API, body)
  173. }
  174. func (ds *ETALLMClient) FileChat(query string, KnowledgeId string, llmModel string, history []json.RawMessage) (resp eta_llm_http.BaseResponse, err error) {
  175. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  176. for _, historyItemStr := range history {
  177. var historyItem eta_llm_http.HistoryContentWeb
  178. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  179. if parseErr != nil {
  180. continue
  181. }
  182. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  183. Content: historyItem.Content,
  184. Role: historyItem.Role,
  185. })
  186. }
  187. var model string
  188. if llmModel != "" {
  189. model = llmModel
  190. } else {
  191. model = ds.LlmModel
  192. }
  193. kbReq := eta_llm_http.DocumentChatRequest{
  194. ModelName: model,
  195. Query: query,
  196. KnowledgeId: KnowledgeId,
  197. History: ChatHistory,
  198. TopK: 20,
  199. ScoreThreshold: 2,
  200. Stream: false,
  201. Temperature: 0.01,
  202. MaxTokens: 0,
  203. PromptName: DEFALUT_PROMPT_NAME,
  204. }
  205. body, err := json.Marshal(kbReq)
  206. if err != nil {
  207. utils.FileLog.Error("内容生成失败,序列化请求参数失败,err", err.Error())
  208. err = fmt.Errorf("内容生成失败,序列化请求参数失败,err:%v", err)
  209. return
  210. }
  211. return ds.DoPost(fmt.Sprintf("%s%s", modelRouter[model], DOCUMENT_CHAT_API), body)
  212. }
  213. func (ds *ETALLMClient) UploadFileToTemplate(files []*os.File, param map[string]interface{}) (data interface{}, err error) {
  214. var pervId string
  215. if value, ok := param["PrevId"]; ok {
  216. pervId = value.(string)
  217. }
  218. var model string
  219. if value, ok := param["LLM"]; ok {
  220. model = value.(string)
  221. } else {
  222. model = ds.LlmModel
  223. }
  224. docReq := eta_llm_http.UploadTempDocsRequest{
  225. ChunkOverlap: "150",
  226. ChunkSize: "750",
  227. PrevId: pervId,
  228. ZhTitleEnhance: "false",
  229. }
  230. body, err := json.Marshal(docReq)
  231. if err != nil {
  232. return
  233. }
  234. resp, err := ds.DoFile(fmt.Sprintf("%s%s", modelRouter[model], UPLOAD_TEMP_DOCS_API), body, files)
  235. if !resp.Success {
  236. err = errors.New(resp.Msg)
  237. return
  238. }
  239. if resp.Data != nil {
  240. var uploadDocsRes eta_llm_http.RagBaseResponse
  241. err = json.Unmarshal(resp.Data, &uploadDocsRes)
  242. if err != nil {
  243. err = errors.New("上传临时文件失败,err:" + err.Error())
  244. return
  245. }
  246. if uploadDocsRes.Code != 200 {
  247. err = errors.New("上传临时文件失败,err:" + uploadDocsRes.Msg)
  248. return
  249. }
  250. var uploadResult eta_llm_http.UploadDocsResponse
  251. err = json.Unmarshal(uploadDocsRes.Data, &uploadResult)
  252. if len(uploadResult.FiledFiles) > 0 {
  253. utils.FileLog.Warn("上传临时文件失败:", uploadResult.FiledFiles)
  254. }
  255. data = uploadResult
  256. return
  257. }
  258. return
  259. }
  260. func (ds *ETALLMClient) SearchKbDocs(query string, KnowledgeBaseName string) (content interface{}, err error) {
  261. kbReq := eta_llm_http.KbSearchDocsRequest{
  262. Query: query,
  263. KnowledgeBaseName: KnowledgeBaseName,
  264. TopK: 10,
  265. ScoreThreshold: 0.5,
  266. Metadata: struct{}{},
  267. }
  268. body, err := json.Marshal(kbReq)
  269. if err != nil {
  270. return
  271. }
  272. resp, err := ds.DoPost(KNOWLEDGE_BASE_SEARCH_DOCS_API, body)
  273. if !resp.Success {
  274. err = errors.New(resp.Msg)
  275. return
  276. }
  277. if resp.Data != nil {
  278. var kbSearchRes []eta_llm_http.SearchDocsResponse
  279. err = json.Unmarshal(resp.Data, &kbSearchRes)
  280. if err != nil {
  281. err = errors.New("搜索知识库失败")
  282. return
  283. }
  284. content = kbSearchRes
  285. return
  286. }
  287. err = errors.New("搜索知识库失败")
  288. return
  289. }
  290. func init() {
  291. err := llm.Register(llm.ETA_LLM_CLIENT, GetInstance())
  292. if err != nil {
  293. utils.FileLog.Error("注册eta_llm_server服务失败:", err)
  294. }
  295. }
  296. func (ds *ETALLMClient) DoPost(apiUrl string, body []byte) (baseResp eta_llm_http.BaseResponse, err error) {
  297. requestReader := bytes.NewReader(body)
  298. response, err := ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  299. if err != nil {
  300. return
  301. }
  302. return parseResponse(response)
  303. }
  304. func (ds *ETALLMClient) DoFile(apiUrl string, body []byte, files []*os.File) (baseResp eta_llm_http.BaseResponse, err error) {
  305. var requestBody bytes.Buffer
  306. writer := multipart.NewWriter(&requestBody)
  307. // 添加文件到请求体
  308. for _, file := range files {
  309. filePath, err := writer.CreateFormFile("files", file.Name())
  310. if err != nil {
  311. return baseResp, fmt.Errorf("创建文件表单字段失败: %w", err)
  312. }
  313. _, err = io.Copy(filePath, file)
  314. if err != nil {
  315. return baseResp, fmt.Errorf("写入文件内容失败: %w", err)
  316. }
  317. }
  318. var params = make(map[string]string)
  319. err = json.Unmarshal(body, &params)
  320. if err != nil {
  321. return
  322. }
  323. // 添加其他参数到请求体
  324. for key, value := range params {
  325. err := writer.WriteField(key, value)
  326. if err != nil {
  327. return baseResp, fmt.Errorf("写入表单字段失败: %w", err)
  328. }
  329. }
  330. // 关闭 writer,完成请求体的构建
  331. err = writer.Close()
  332. if err != nil {
  333. return baseResp, fmt.Errorf("关闭 multipart writer 失败: %w", err)
  334. }
  335. request, err := http.NewRequest("POST", ds.BaseURL+apiUrl, &requestBody)
  336. request.Header.Set("Content-Type", writer.FormDataContentType())
  337. response, err := ds.HttpClient.Do(request)
  338. if err != nil {
  339. return
  340. }
  341. return parseResponse(response)
  342. }
  343. func (ds *ETALLMClient) DoStreamPost(apiUrl string, body []byte) (baseResp *http.Response, err error) {
  344. requestReader := bytes.NewReader(body)
  345. return ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  346. }
  347. func parseResponse(response *http.Response) (baseResp eta_llm_http.BaseResponse, err error) {
  348. defer func() {
  349. _ = response.Body.Close()
  350. }()
  351. baseResp.Ret = response.StatusCode
  352. if response.StatusCode != http.StatusOK {
  353. baseResp.Msg = fmt.Sprintf("请求失败,状态码:%d, 状态信息:%s", response.StatusCode, http.StatusText(response.StatusCode))
  354. return
  355. }
  356. bodyBytes, err := io.ReadAll(response.Body)
  357. if err != nil {
  358. err = fmt.Errorf("读取响应体失败: %w", err)
  359. return
  360. }
  361. baseResp.Success = true
  362. baseResp.Data = bodyBytes
  363. return
  364. }
  365. func ParseStreamResponse(response *http.Response) (contentChan chan string, errChan chan error, closeChan chan struct{}, closeLlmChan chan bool) {
  366. contentChan = make(chan string, 10)
  367. errChan = make(chan error, 10)
  368. closeChan = make(chan struct{})
  369. closeLlmChan = make(chan bool, 1)
  370. go func() {
  371. defer close(contentChan)
  372. defer close(errChan)
  373. defer close(closeChan)
  374. defer close(closeLlmChan)
  375. scanner := bufio.NewScanner(response.Body)
  376. scanner.Split(bufio.ScanLines)
  377. for scanner.Scan() {
  378. select {
  379. case <-closeLlmChan:
  380. return
  381. default:
  382. line := scanner.Text()
  383. if line == "" {
  384. continue
  385. }
  386. // 忽略 "ping" 行
  387. if strings.HasPrefix(line, ": ping") {
  388. continue
  389. }
  390. // 去除 "data: " 前缀
  391. if strings.HasPrefix(line, "data: ") {
  392. line = strings.TrimPrefix(line, "data: ")
  393. }
  394. var chunk eta_llm_http.ChunkResponse
  395. if err := json.Unmarshal([]byte(line), &chunk); err != nil {
  396. fmt.Println("解析错误的line:" + line)
  397. errChan <- fmt.Errorf("解析 JSON 块失败: %w", err)
  398. return
  399. }
  400. // 处理每个 chunk
  401. if chunk.Choices != nil && len(chunk.Choices) > 0 {
  402. for _, choice := range chunk.Choices {
  403. if choice.Delta.Content != "" {
  404. contentChan <- choice.Delta.Content
  405. }
  406. }
  407. }
  408. }
  409. }
  410. if err := scanner.Err(); err != nil {
  411. errChan <- fmt.Errorf("读取响应体失败: %w", err)
  412. return
  413. }
  414. }()
  415. return
  416. }