// elasticsearch.go

  1. package services
  2. import (
  3. "context"
  4. "encoding/json"
  5. "fmt"
  6. "hongze/hongze_cygx/models"
  7. "hongze/hongze_cygx/utils"
  8. "html"
  9. "strconv"
  10. "strings"
  11. //"gopkg.in/olivere/elastic.v5"
  12. //"gopkg.in/olivere/elastic.v5/config"
  13. "github.com/PuerkitoBio/goquery"
  14. "github.com/olivere/elastic/v7"
  15. "github.com/olivere/elastic/v7/config"
  16. )
  // Connection settings handed to the Elasticsearch client configuration.
  //
  // NOTE(review): these credentials are hard-coded in source. They should be
  // rotated and loaded from configuration or a secret store instead.

  // ES_URL is the HTTP endpoint of the Elasticsearch cluster.
  const ES_URL = "http://es-cn-nif227b580019rgw6.public.elasticsearch.aliyuncs.com:9200"

  // ES_USERNAME is the user name sent to the cluster.
  const ES_USERNAME = "elastic"

  // ES_PASSWORD is the password sent to the cluster.
  const ES_PASSWORD = "hongze@2021"

  // Grafana pwd-> 20521bb9
  // Grafana username-> emon
  // NOTE(review): the Grafana login above is unrelated to this file's code and
  // should not be kept in source either.
  24. func SaveData() {
  25. //fmt.Println("start")
  26. var sniff = false //<4>
  27. cfg := &config.Config{
  28. URL: ES_URL,
  29. Username: ES_USERNAME,
  30. Password: ES_PASSWORD,
  31. }
  32. cfg.Sniff = &sniff
  33. var client, err = elastic.NewClientFromConfig(cfg)
  34. if err != nil {
  35. fmt.Println("NewClientFromConfig Err:" + err.Error())
  36. return
  37. }
  38. var esIndex = "cygx_article"
  39. //var esType = "article"
  40. //
  41. exists, err := client.IndexExists(esIndex).Do(context.Background()) //<5>
  42. if err != nil {
  43. fmt.Println("IndexExists Err:" + err.Error())
  44. return
  45. }
  46. if !exists {
  47. _, err = client.CreateIndex(esIndex).Do(context.Background())
  48. if err != nil {
  49. fmt.Println("CreateIndex Err:" + err.Error())
  50. return
  51. }
  52. }
  53. /*
  54. 3161,3190,3226,3244,3264,3285,3310,3334,3370,3397,3418,3446,3477,3497,3526,3554
  55. */
  56. idStr := `3584,3644`
  57. idArr := strings.Split(idStr, ",")
  58. for _, v := range idArr {
  59. id, _ := strconv.Atoi(v)
  60. item, err := models.GetArticleDetailById(id)
  61. if err != nil {
  62. fmt.Println("GetArticleDetailById Err:" + err.Error())
  63. return
  64. }
  65. content := html.UnescapeString(item.Body)
  66. doc, err := goquery.NewDocumentFromReader(strings.NewReader(content))
  67. if err != nil {
  68. fmt.Println("create doc err:", err.Error())
  69. return
  70. }
  71. bodyText := doc.Text()
  72. item.BodyText = bodyText
  73. //新增
  74. resp, err := client.Index().Index(esIndex).Id(strconv.Itoa(item.ArticleId)).BodyJson(item).Do(context.Background())
  75. if err != nil {
  76. fmt.Println("insert es failed", err.Error())
  77. return
  78. }
  79. fmt.Println(resp.Status)
  80. }
  81. /*
  82. //根据id查询
  83. searchById, err := client.Get().Index(esIndex).Type(esType).Id("3138").Do(context.Background())
  84. if searchById.Found {
  85. body, err := searchById.Source.MarshalJSON()
  86. fmt.Println("body:",string(body))
  87. fmt.Println(err)
  88. //var resultType models.ArticleDetail
  89. //if err := json.Unmarshal(searchById.Source,&resultType); err != nil{
  90. // log.Error(err.Error())
  91. //}
  92. //fmt.Printf("search by id: %#v \n",resultType)
  93. }
  94. */
  95. ////查询index中所有的数据
  96. //var resultType models.CygxArticle
  97. //searchAll,err := client.Search(esIndex).Type(esType).Do(context.Background())
  98. //for _,item := range searchAll.Each(reflect.TypeOf(resultType)) {
  99. // language := item.(models.CygxArticle)
  100. // fmt.Printf("search by index all: %#v \n",language)
  101. //}
  102. //根据检索条件查询
  103. // boolquery := elastic.NewBoolQuery()
  104. // boolquery.Should(elastic.NewMatchQuery("Body", "专家"))
  105. // highlight := elastic.NewHighlight()
  106. // highlight = highlight.Fields(elastic.NewHighlighterField("Body"))
  107. // highlight = highlight.PreTags("<font color='red'>").PostTags("</font>")
  108. // var pageSize int
  109. // pageSize = 20
  110. // searchByMatch, err := client.Search(esIndex).Highlight(highlight).Size(pageSize).Query(boolquery).Do(context.Background())
  111. // var result string
  112. // if searchByMatch.Hits != nil {
  113. // }
  114. // //fmt.Println(string(result))
  115. // utils.FileLog.Info("%s", string(result))
  116. //var resultType models.CygxArticle
  117. //for k,item := range searchByMatch.Each(reflect.TypeOf(resultType)) {
  118. // language := item.(models.CygxArticle)
  119. // fmt.Printf("search by match: %#v \n",language)
  120. //
  121. // fmt.Println(k)
  122. // result,err:=json.Marshal(language)
  123. // fmt.Println(err)
  124. // utils.FileLog.Info("%s",string(result))
  125. //}
  126. // Perform the search request.
  127. //searchByMatch, err := client.Search(esIndex).Type(esType).Query(query).From(1).Size(10).Do(context.Background())
  128. fmt.Println("end")
  129. }
  130. func SearchByKeyWord(keyWord,categoryName string, pageSize int) (result []*models.SearchItem, err error) {
  131. if pageSize == 0 {
  132. pageSize = 20
  133. }
  134. var sniff = false //<4>
  135. cfg := &config.Config{
  136. URL: ES_URL,
  137. Username: ES_USERNAME,
  138. Password: ES_PASSWORD,
  139. }
  140. cfg.Sniff = &sniff
  141. client, err := elastic.NewClientFromConfig(cfg)
  142. if err != nil {
  143. return
  144. }
  145. var esIndex = "cygx_article"
  146. termsQuery:=elastic.NewTermsQuery("category_name",categoryName)
  147. boolquery := elastic.NewBoolQuery()
  148. fmt.Println("get start keyWordArr")
  149. keyWordArr, err := GetIndustryMapNameSlice(keyWord)
  150. if err != nil {
  151. go utils.SendEmail(utils.APPNAME+" "+utils.RunMode+"异常提醒:", "GetIndustryMapNameSlice:"+err.Error(), utils.EmailSendToUsers)
  152. }
  153. keyWordArr = append(keyWordArr, keyWord)
  154. fmt.Println(keyWord)
  155. fmt.Println(keyWordArr)
  156. var newKeyWordArr []string
  157. if len(keyWordArr) > 2 {
  158. newKeyWordArr = append(keyWordArr[2:], keyWordArr[0:2]...)
  159. }
  160. fmt.Println(newKeyWordArr)
  161. fmt.Println("get end keyWordArr")
  162. searchMap := make(map[int]int)
  163. for k, v := range newKeyWordArr {
  164. fmt.Println(k, v)
  165. boolquery.Must(elastic.NewMatchQuery("Title", keyWord), elastic.NewMatchQuery("BodyText", keyWord))
  166. highlight := elastic.NewHighlight()
  167. highlight = highlight.Fields(elastic.NewHighlighterField("Title"), elastic.NewHighlighterField("BodyText"))
  168. highlight = highlight.PreTags("<font color='red'>").PostTags("</font>")
  169. searchByMatch, err := client.Search(esIndex).Highlight(highlight).Size(pageSize).Query(termsQuery).Query(boolquery).Do(context.Background())
  170. if err != nil {
  171. return result, err
  172. }
  173. if searchByMatch.Hits != nil {
  174. for _, v := range searchByMatch.Hits.Hits {
  175. articleJson, err := v.Source.MarshalJSON()
  176. if err != nil {
  177. return nil, err
  178. }
  179. article := new(models.CygxArticle)
  180. err = json.Unmarshal(articleJson, &article)
  181. if err != nil {
  182. return nil, err
  183. }
  184. if _, ok := searchMap[article.ArticleId]; !ok {
  185. searchItem := new(models.SearchItem)
  186. searchItem.ArticleId, _ = strconv.Atoi(v.Id)
  187. searchItem.Body = v.Highlight["BodyText"]
  188. var title string
  189. if len(v.Highlight["Title"]) > 0 {
  190. title = v.Highlight["Title"][0]
  191. } else {
  192. title = article.Title
  193. }
  194. searchItem.Title = title
  195. searchItem.PublishDate = article.PublishDate
  196. result = append(result, searchItem)
  197. searchMap[article.ArticleId] = article.ArticleId
  198. }
  199. }
  200. }
  201. }
  202. return
  203. }