eta_llm_client.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  1. package eta_llm
  2. import (
  3. "bufio"
  4. "bytes"
  5. "encoding/json"
  6. "errors"
  7. "eta/eta_api/models"
  8. "eta/eta_api/utils"
  9. "eta/eta_api/utils/llm"
  10. "eta/eta_api/utils/llm/eta_llm/eta_llm_http"
  11. "fmt"
  12. "io"
  13. "mime/multipart"
  14. "net/http"
  15. "os"
  16. "strings"
  17. "sync"
  18. )
  19. var (
  20. dsOnce sync.Once
  21. etaLlmClient *ETALLMClient
  22. modelRouter = map[string]string{
  23. "deepseek-r1:32b": "/dsr1",
  24. "qwq:32b": "/qwq",
  25. }
  26. )
  27. const (
  28. KNOWLEDEG_CHAT_MODE = "local_kb"
  29. DEFALUT_PROMPT_NAME = "default"
  30. CONTENT_TYPE_JSON = "application/json"
  31. KNOWLEDGE_BASE_CHAT_API = "/chat/kb_chat"
  32. COMPLETION_CHAT_API = "/chat/chat/completions"
  33. DOCUMENT_CHAT_API = "/chat/file_chat"
  34. COMPLETION_CHAT_API = "/chat/chat/completions"
  35. KNOWLEDGE_BASE_SEARCH_DOCS_API = "/knowledge_base/search_docs"
  36. UPLOAD_TEMP_DOCS_API = "/knowledge_base/upload_temp_docs"
  37. )
  38. type ETALLMClient struct {
  39. *llm.LLMClient
  40. LlmModel string
  41. }
  42. type LLMConfig struct {
  43. LlmAddress string `json:"llm_server"`
  44. LlmModel string `json:"llm_model"`
  45. }
  46. func GetInstance() llm.LLMService {
  47. dsOnce.Do(func() {
  48. confStr := models.BusinessConfMap[models.LLMInitConfig]
  49. if confStr == "" {
  50. utils.FileLog.Error("LLM配置为空")
  51. return
  52. }
  53. var config LLMConfig
  54. err := json.Unmarshal([]byte(confStr), &config)
  55. if err != nil {
  56. utils.FileLog.Error("LLM配置错误")
  57. }
  58. if etaLlmClient == nil {
  59. etaLlmClient = &ETALLMClient{
  60. LLMClient: llm.NewLLMClient(config.LlmAddress, 300),
  61. LlmModel: config.LlmModel,
  62. }
  63. }
  64. })
  65. return etaLlmClient
  66. }
  67. func (ds *ETALLMClient) DocumentChat(query string, KnowledgeId string, history []json.RawMessage, stream bool) (llmRes *http.Response, err error) {
  68. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  69. for _, historyItemStr := range history {
  70. var historyItem eta_llm_http.HistoryContent
  71. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  72. if parseErr != nil {
  73. continue
  74. }
  75. //str := strings.Split(historyItemStr, "-")
  76. //historyItem := eta_llm_http.HistoryContent{
  77. // Role: str[0],
  78. // Content: str[1],
  79. //}
  80. ChatHistory = append(ChatHistory, historyItem)
  81. }
  82. kbReq := eta_llm_http.DocumentChatRequest{
  83. Query: query,
  84. KnowledgeId: KnowledgeId,
  85. History: ChatHistory,
  86. TopK: 3,
  87. //ScoreThreshold: 0.5,
  88. ScoreThreshold: 2,
  89. Stream: stream,
  90. ModelName: ds.LlmModel,
  91. //Temperature: 0.7,
  92. Temperature: 0.01,
  93. MaxTokens: 0,
  94. //PromptName: DEFALUT_PROMPT_NAME,
  95. }
  96. //fmt.Printf("%v", kbReq.History)
  97. body, err := json.Marshal(kbReq)
  98. fmt.Println(string(body))
  99. if err != nil {
  100. return
  101. }
  102. return ds.DoStreamPost(DOCUMENT_CHAT_API, body)
  103. }
  104. func (ds *ETALLMClient) CompletionChat(query string, messages []json.RawMessage) (llmRes *http.Response, err error) {
  105. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  106. for _, historyItemStr := range messages {
  107. var historyItem eta_llm_http.HistoryContentWeb
  108. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  109. if parseErr != nil {
  110. continue
  111. }
  112. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  113. Content: historyItem.Content,
  114. Role: historyItem.Role,
  115. })
  116. }
  117. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  118. Content: query,
  119. Role: "user",
  120. })
  121. kbReq := eta_llm_http.CompletionChatRequest{
  122. Mode: KNOWLEDEG_CHAT_MODE,
  123. Messages: ChatHistory,
  124. TopK: 3,
  125. ScoreThreshold: 0.5,
  126. Stream: true,
  127. Model: ds.LlmModel,
  128. Temperature: 0.7,
  129. MaxTokens: 0,
  130. PromptName: DEFALUT_PROMPT_NAME,
  131. ReturnDirect: false,
  132. }
  133. fmt.Printf("%v", kbReq.Messages)
  134. utils.FileLog.Info("kbReq.Messages: %v", kbReq.Messages)
  135. body, err := json.Marshal(kbReq)
  136. if err != nil {
  137. return
  138. }
  139. return ds.DoStreamPost(COMPLETION_CHAT_API, body)
  140. }
  141. func (ds *ETALLMClient) KnowledgeBaseChat(query string, KnowledgeBaseName string, history []json.RawMessage) (llmRes *http.Response, err error) {
  142. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  143. for _, historyItemStr := range history {
  144. var historyItem eta_llm_http.HistoryContentWeb
  145. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  146. if parseErr != nil {
  147. continue
  148. }
  149. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  150. Content: historyItem.Content,
  151. Role: historyItem.Role,
  152. })
  153. }
  154. kbReq := eta_llm_http.KbChatRequest{
  155. Query: query,
  156. Mode: KNOWLEDEG_CHAT_MODE,
  157. KbName: KnowledgeBaseName,
  158. History: ChatHistory,
  159. TopK: 3,
  160. ScoreThreshold: 0.5,
  161. Stream: true,
  162. Model: ds.LlmModel,
  163. Temperature: 0.7,
  164. MaxTokens: 0,
  165. PromptName: DEFALUT_PROMPT_NAME,
  166. ReturnDirect: false,
  167. }
  168. fmt.Printf("%v", kbReq.History)
  169. body, err := json.Marshal(kbReq)
  170. if err != nil {
  171. return
  172. }
  173. return ds.DoStreamPost(KNOWLEDGE_BASE_CHAT_API, body)
  174. }
  175. func (ds *ETALLMClient) FileChat(query string, KnowledgeId string, llmModel string, history []json.RawMessage) (resp eta_llm_http.BaseResponse, err error) {
  176. ChatHistory := make([]eta_llm_http.HistoryContent, 0)
  177. for _, historyItemStr := range history {
  178. var historyItem eta_llm_http.HistoryContentWeb
  179. parseErr := json.Unmarshal(historyItemStr, &historyItem)
  180. if parseErr != nil {
  181. continue
  182. }
  183. ChatHistory = append(ChatHistory, eta_llm_http.HistoryContent{
  184. Content: historyItem.Content,
  185. Role: historyItem.Role,
  186. })
  187. }
  188. var model string
  189. if llmModel != "" {
  190. model = llmModel
  191. } else {
  192. model = ds.LlmModel
  193. }
  194. kbReq := eta_llm_http.DocumentChatRequest{
  195. ModelName: model,
  196. Query: query,
  197. KnowledgeId: KnowledgeId,
  198. History: ChatHistory,
  199. TopK: 20,
  200. ScoreThreshold: 2,
  201. Stream: false,
  202. Temperature: 0.01,
  203. MaxTokens: 0,
  204. PromptName: DEFALUT_PROMPT_NAME,
  205. }
  206. body, err := json.Marshal(kbReq)
  207. if err != nil {
  208. utils.FileLog.Error("内容生成失败,序列化请求参数失败,err", err.Error())
  209. err = fmt.Errorf("内容生成失败,序列化请求参数失败,err:%v", err)
  210. return
  211. }
  212. return ds.DoPost(fmt.Sprintf("%s%s", modelRouter[model], DOCUMENT_CHAT_API), body)
  213. }
  214. func (ds *ETALLMClient) UploadFileToTemplate(files []*os.File, param map[string]interface{}) (data interface{}, err error) {
  215. var pervId string
  216. if value, ok := param["PrevId"]; ok {
  217. pervId = value.(string)
  218. }
  219. var model string
  220. if value, ok := param["LLM"]; ok {
  221. model = value.(string)
  222. } else {
  223. model = ds.LlmModel
  224. }
  225. docReq := eta_llm_http.UploadTempDocsRequest{
  226. ChunkOverlap: "150",
  227. ChunkSize: "750",
  228. PrevId: pervId,
  229. ZhTitleEnhance: "false",
  230. }
  231. body, err := json.Marshal(docReq)
  232. if err != nil {
  233. return
  234. }
  235. resp, err := ds.DoFile(fmt.Sprintf("%s%s", modelRouter[model], UPLOAD_TEMP_DOCS_API), body, files)
  236. if !resp.Success {
  237. err = errors.New(resp.Msg)
  238. return
  239. }
  240. if resp.Data != nil {
  241. var uploadDocsRes eta_llm_http.RagBaseResponse
  242. err = json.Unmarshal(resp.Data, &uploadDocsRes)
  243. if err != nil {
  244. err = errors.New("上传临时文件失败,err:" + err.Error())
  245. return
  246. }
  247. if uploadDocsRes.Code != 200 {
  248. err = errors.New("上传临时文件失败,err:" + uploadDocsRes.Msg)
  249. return
  250. }
  251. var uploadResult eta_llm_http.UploadDocsResponse
  252. err = json.Unmarshal(uploadDocsRes.Data, &uploadResult)
  253. if len(uploadResult.FiledFiles) > 0 {
  254. utils.FileLog.Warn("上传临时文件失败:", uploadResult.FiledFiles)
  255. }
  256. data = uploadResult
  257. return
  258. }
  259. return
  260. }
  261. func (ds *ETALLMClient) SearchKbDocs(query string, KnowledgeBaseName string) (content interface{}, err error) {
  262. kbReq := eta_llm_http.KbSearchDocsRequest{
  263. Query: query,
  264. KnowledgeBaseName: KnowledgeBaseName,
  265. TopK: 10,
  266. ScoreThreshold: 0.5,
  267. Metadata: struct{}{},
  268. }
  269. body, err := json.Marshal(kbReq)
  270. if err != nil {
  271. return
  272. }
  273. resp, err := ds.DoPost(KNOWLEDGE_BASE_SEARCH_DOCS_API, body)
  274. if !resp.Success {
  275. err = errors.New(resp.Msg)
  276. return
  277. }
  278. if resp.Data != nil {
  279. var kbSearchRes []eta_llm_http.SearchDocsResponse
  280. err = json.Unmarshal(resp.Data, &kbSearchRes)
  281. if err != nil {
  282. err = errors.New("搜索知识库失败")
  283. return
  284. }
  285. content = kbSearchRes
  286. return
  287. }
  288. err = errors.New("搜索知识库失败")
  289. return
  290. }
  291. func init() {
  292. err := llm.Register(llm.ETA_LLM_CLIENT, GetInstance())
  293. if err != nil {
  294. utils.FileLog.Error("注册eta_llm_server服务失败:", err)
  295. }
  296. }
  297. func (ds *ETALLMClient) DoPost(apiUrl string, body []byte) (baseResp eta_llm_http.BaseResponse, err error) {
  298. requestReader := bytes.NewReader(body)
  299. response, err := ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  300. if err != nil {
  301. return
  302. }
  303. return parseResponse(response)
  304. }
  305. func (ds *ETALLMClient) DoFile(apiUrl string, body []byte, files []*os.File) (baseResp eta_llm_http.BaseResponse, err error) {
  306. var requestBody bytes.Buffer
  307. writer := multipart.NewWriter(&requestBody)
  308. // 添加文件到请求体
  309. for _, file := range files {
  310. filePath, err := writer.CreateFormFile("files", file.Name())
  311. if err != nil {
  312. return baseResp, fmt.Errorf("创建文件表单字段失败: %w", err)
  313. }
  314. _, err = io.Copy(filePath, file)
  315. if err != nil {
  316. return baseResp, fmt.Errorf("写入文件内容失败: %w", err)
  317. }
  318. }
  319. var params = make(map[string]string)
  320. err = json.Unmarshal(body, &params)
  321. if err != nil {
  322. return
  323. }
  324. // 添加其他参数到请求体
  325. for key, value := range params {
  326. err := writer.WriteField(key, value)
  327. if err != nil {
  328. return baseResp, fmt.Errorf("写入表单字段失败: %w", err)
  329. }
  330. }
  331. // 关闭 writer,完成请求体的构建
  332. err = writer.Close()
  333. if err != nil {
  334. return baseResp, fmt.Errorf("关闭 multipart writer 失败: %w", err)
  335. }
  336. request, err := http.NewRequest("POST", ds.BaseURL+apiUrl, &requestBody)
  337. request.Header.Set("Content-Type", writer.FormDataContentType())
  338. response, err := ds.HttpClient.Do(request)
  339. if err != nil {
  340. return
  341. }
  342. return parseResponse(response)
  343. }
  344. func (ds *ETALLMClient) DoStreamPost(apiUrl string, body []byte) (baseResp *http.Response, err error) {
  345. requestReader := bytes.NewReader(body)
  346. return ds.HttpClient.Post(ds.BaseURL+apiUrl, CONTENT_TYPE_JSON, requestReader)
  347. }
  348. func parseResponse(response *http.Response) (baseResp eta_llm_http.BaseResponse, err error) {
  349. defer func() {
  350. _ = response.Body.Close()
  351. }()
  352. baseResp.Ret = response.StatusCode
  353. if response.StatusCode != http.StatusOK {
  354. baseResp.Msg = fmt.Sprintf("请求失败,状态码:%d, 状态信息:%s", response.StatusCode, http.StatusText(response.StatusCode))
  355. return
  356. }
  357. bodyBytes, err := io.ReadAll(response.Body)
  358. if err != nil {
  359. err = fmt.Errorf("读取响应体失败: %w", err)
  360. return
  361. }
  362. baseResp.Success = true
  363. baseResp.Data = bodyBytes
  364. return
  365. }
  366. func ParseStreamResponse(response *http.Response) (contentChan chan string, errChan chan error, closeChan chan struct{}, closeLlmChan chan bool) {
  367. contentChan = make(chan string, 10)
  368. errChan = make(chan error, 10)
  369. closeChan = make(chan struct{})
  370. closeLlmChan = make(chan bool, 1)
  371. go func() {
  372. defer close(contentChan)
  373. defer close(errChan)
  374. defer close(closeChan)
  375. defer close(closeLlmChan)
  376. scanner := bufio.NewScanner(response.Body)
  377. scanner.Split(bufio.ScanLines)
  378. for scanner.Scan() {
  379. select {
  380. case <-closeLlmChan:
  381. return
  382. default:
  383. line := scanner.Text()
  384. if line == "" {
  385. continue
  386. }
  387. // 忽略 "ping" 行
  388. if strings.HasPrefix(line, ": ping") {
  389. continue
  390. }
  391. // 去除 "data: " 前缀
  392. if strings.HasPrefix(line, "data: ") {
  393. line = strings.TrimPrefix(line, "data: ")
  394. }
  395. var chunk eta_llm_http.ChunkResponse
  396. if err := json.Unmarshal([]byte(line), &chunk); err != nil {
  397. fmt.Println("解析错误的line:" + line)
  398. errChan <- fmt.Errorf("解析 JSON 块失败: %w", err)
  399. return
  400. }
  401. // 处理每个 chunk
  402. if chunk.Choices != nil && len(chunk.Choices) > 0 {
  403. for _, choice := range chunk.Choices {
  404. if choice.Delta.Content != "" {
  405. contentChan <- choice.Delta.Content
  406. }
  407. }
  408. }
  409. }
  410. }
  411. if err := scanner.Err(); err != nil {
  412. errChan <- fmt.Errorf("读取响应体失败: %w", err)
  413. return
  414. }
  415. }()
  416. return
  417. }