task.go 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411
  1. package services
  2. import (
  3. "fmt"
  4. "github.com/PuerkitoBio/goquery"
  5. "github.com/beego/beego/v2/task"
  6. "hongze/hongze_cygx/models"
  7. "hongze/hongze_cygx/utils"
  8. "html"
  9. "strconv"
  10. "strings"
  11. "time"
  12. )
  13. func Task() {
  14. fmt.Println("start")
  15. //同步数据
  16. if utils.RunMode == "release" {
  17. syncTacticsListAddreport := task.NewTask("syncTacticsListAddreport", "0 */5 * * * *", SyncTacticsListAddreport) //同步文章
  18. task.AddTask("syncTacticsListAddreport", syncTacticsListAddreport)
  19. getSummarytoEs := task.NewTask("getSummarytoEs", "0 */30 * * * *", GetSummarytoEs) //同步纪要库内容到Es
  20. task.AddTask("getSummarytoEs", getSummarytoEs)
  21. } else {
  22. getArticleListByApi := task.NewTask("getArticleListByApi", "0 */5 * * * *", GetArticleListByApi) //通过三方接口获取策略平台上的文章
  23. task.AddTask("getArticleListByApi", getArticleListByApi)
  24. }
  25. //修改任务状态
  26. updateActivitySattus := task.NewTask("syncTacticsListAddreport", "0 */1 8-22 * * *", UpdateActivitySattus)
  27. task.AddTask("updateActivitySattus", updateActivitySattus)
  28. //更新深 和新的标签
  29. updateIndustrialManagementLabel := task.NewTask("updateIndustrialManagementLabel", "0 */30 * * * *", UpdateIndustrialManagementLabel)
  30. task.AddTask("updateIndustrialManagementLabel", updateIndustrialManagementLabel)
  31. //更新报告的搜索栏内容
  32. //UpdateIndustrialManagementSubjectNnames()
  33. //会议提醒模板消息推送
  34. sendActivityBeginMsg := task.NewTask("sendActivityBeginMsg", "0 */10 8-22 * * *", SendActivityBeginMsg) //会议前60分钟的提醒
  35. task.AddTask("sendActivityBeginMsg", sendActivityBeginMsg)
  36. sendActivityBeginMsgMeeting := task.NewTask("sendActivityBeginMsgMeeting", "0 */5 8-22 * * *", SendActivityBeginMsgMeeting) //会议前15分钟的提醒
  37. task.AddTask("sendActivityBeginMsgMeeting", sendActivityBeginMsgMeeting)
  38. //预约外呼名单,会前1小时自动发送邮件给专家组
  39. sendEmailFileToExpert := task.NewTask("sendEmailFileToExpert", "0 */5 8-22 * * *", SendEmailFileToExpert) //预约外呼名单,会前1小时自动发送邮件给专家组
  40. task.AddTask("sendEmailFileToExpert", sendEmailFileToExpert)
  41. sendEmailFileForAskMsgResearch := task.NewTask("sendEmailFileForAskMsgResearch", "0 */5 8-22 * * *", SendEmailFileForAskMsgResearch) //研选系列专家电话会,会前1小时将问题列表发送给邮箱
  42. task.AddTask("sendEmailFileForAskMsgResearch", sendEmailFileForAskMsgResearch)
  43. sendEmailFileForAskMsg := task.NewTask("sendEmailFileForAskMsg", "0 */5 8-22 * * *", SendEmailFileForAskMsg) //非研选系列专家电话会,根据主持人姓名,会前15分钟将问题列表发送给至该主持人对应邮箱
  44. task.AddTask("sendEmailFileForAskMsg", sendEmailFileForAskMsg)
  45. //白名单发送2
  46. sendEmailUserWhiteListChange := task.NewTask("sendEmailUserWhiteListChange", "0 00 17 * * *", SendEmailUserWhiteListChange) //新增 和冻结的客户白名单
  47. task.AddTask("sendEmailUserWhiteListChange", sendEmailUserWhiteListChange)
  48. //更改对应产业的文章阅读数量
  49. chageIndustrialArticleNum := task.NewTask("chageIndustrialArticleNum", "0 01 00 * * *", ChageIndustrialArticleNum) //更改对应产业的文章阅读数量
  50. task.AddTask("chageIndustrialArticleNum", chageIndustrialArticleNum)
  51. //IndustrialArticleNum()
  52. //GetAddpArticle() //同步日度点评数据
  53. task.StartTask()
  54. fmt.Println("end")
  55. }
  56. ////白名单发送
  57. //sendEmailUserWhiteList := task.NewTask("sendEmailUserWhiteList", "0 27 17 * * *", SendEmailUserWhiteList) //白名单发送
  58. //task.AddTask("sendEmailUserWhiteList", sendEmailUserWhiteList)
  59. //editOutboundMobile := task.NewTask("editOutboundMobile", "0 */1 8-22 * * *", EditOutboundMobile) //同步外呼号码与手机号
  60. //task.AddTask("sendEmailFileToExpert", editOutboundMobile)
  61. //editUserOutboundMobile := task.NewTask("editUserOutboundMobile", "0 27 14 * * * ", EditUserOutboundMobile) //同步外呼号码与手机号
  62. //task.AddTask("editUserOutboundMobile", editUserOutboundMobile)
  63. func ElasticOption() {
  64. //SyncTacticsList()
  65. //toolbox.StartTask()
  66. //keyWord := "专家"
  67. //pageSize := 20
  68. //SearchByKeyWord(keyWord, pageSize)
  69. //SaveData()
  70. //GetIndustryMap()
  71. //解析报告
  72. //GetArticleExpert()
  73. //SearchByKeyWordQuery("")
  74. //AddMap()
  75. //同步数据
  76. //ImportData()
  77. //AddMap()
  78. //Search("光伏行业")
  79. //修复报告内容
  80. //GetArticleAll()
  81. //indexName := "article_list"
  82. // mappingJson := `{
  83. //"mappings": {
  84. // "dynamic": true,
  85. // "properties": {
  86. // "ArticleId": {
  87. // "type": "integer"
  88. // },
  89. // "Title": {
  90. // "type": "text",
  91. // "analyzer": "ik_smart"
  92. // },
  93. // "TitleEn": {
  94. // "type": "text",
  95. // "analyzer": "ik_smart"
  96. // },
  97. // "UpdateFrequency": {
  98. // "type": "text",
  99. // "analyzer": "ik_smart"
  100. // },
  101. // "CreateDate": {
  102. // "type": "text",
  103. // "analyzer": "ik_smart"
  104. // },
  105. // "PublishDate": {
  106. // "type": "text",
  107. // "analyzer": "ik_smart"
  108. // },
  109. // "Abstract": {
  110. // "type": "text",
  111. // "analyzer": "ik_smart"
  112. // },
  113. // "CategoryName": {
  114. // "type": "text",
  115. // "analyzer": "ik_smart"
  116. // },
  117. // "SubCategoryName": {
  118. // "type": "text",
  119. // "analyzer": "ik_smart"
  120. // },
  121. // "InterviewDate": {
  122. // "type": "text",
  123. // "analyzer": "ik_smart"
  124. // },
  125. // "ExpertBackground": {
  126. // "type": "text",
  127. // "analyzer": "ik_smart"
  128. // },
  129. // "ExpertNumber": {
  130. // "type": "text",
  131. // "analyzer": "ik_smart"
  132. // },
  133. // "Department": {
  134. // "type": "text",
  135. // "analyzer": "ik_smart"
  136. // },
  137. // "BodyText": {
  138. // "type": "text",
  139. // "analyzer": "ik_smart"
  140. // },
  141. // "ArticleIdMd5": {
  142. // "type": "text",
  143. // "analyzer": "ik_smart"
  144. // }
  145. // }
  146. //}
  147. //}`
  148. //EsCreateIndex(indexName,mappingJson)
  149. //插入数据
  150. //allList, err := models.GetArticleAll()
  151. //if err != nil {
  152. // fmt.Println("GetArticleAll Err:", err.Error())
  153. // return
  154. //}
  155. //
  156. //indexName := "article_list"
  157. //
  158. //for _, v := range allList {
  159. // content := html.UnescapeString(v.Body)
  160. // doc, err := goquery.NewDocumentFromReader(strings.NewReader(content))
  161. // if err != nil {
  162. // fmt.Println("create doc err:", err.Error())
  163. // return
  164. // }
  165. // bodyText := doc.Text()
  166. //
  167. // item := new(ElasticArticleDetail)
  168. // item.ArticleId = v.ArticleId
  169. // item.Title = v.Title
  170. // item.TitleEn = v.TitleEn
  171. // item.UpdateFrequency = v.UpdateFrequency
  172. // item.CreateDate = v.CreateDate
  173. // item.PublishDate = v.PublishDate
  174. // item.Abstract = v.Abstract
  175. // item.CategoryName = v.CategoryName
  176. // item.SubCategoryName = v.SubCategoryName
  177. // item.InterviewDate = v.InterviewDate
  178. // item.ExpertBackground = v.ExpertBackground
  179. // item.ExpertNumber = v.ExpertNumber
  180. // item.Department = v.Department
  181. // item.ArticleIdMd5 = v.ArticleIdMd5
  182. // item.BodyText = bodyText
  183. // EsAddOrEditData(indexName, strconv.Itoa(v.ArticleId), item)
  184. //}
  185. //fmt.Println("bm")
  186. //bm, err := cache.NewCache("file", `{"CachePath":"./cache","FileSuffix":".cache", "EmbedExpiry": "120"}`)
  187. ////
  188. //if err != nil {
  189. // fmt.Println("false",err)
  190. //}
  191. ////fmt.Println(bm)
  192. //key:="put_key_one"
  193. ////bm.Put(key,1,1*time.Second)
  194. //b:=bm.IsExist(key)
  195. //fmt.Println(b)
  196. //同步策略文章
  197. //SyncTacticsList()
  198. //indexName := "article_list"
  199. //EsDeleteData(indexName,)
  200. }
  201. /*
  202. searchItem := new(models.SearchItem)
  203. searchItem.ArticleId, _ = strconv.Atoi(v.Id)
  204. searchItem.Body = v.Highlight["BodyText"]
  205. searchItem.Title = title
  206. searchItem.PublishDate = article.PublishDate
  207. */
  208. func CreateIndex() {
  209. indexName := "cygx_article_v4" //utils.IndexName
  210. mappingJson := `{
  211. "mappings": {
  212. "dynamic": true,
  213. "properties": {
  214. "ArticleId": {
  215. "type": "integer"
  216. },
  217. "BodyText": {
  218. "type": "text",
  219. "term_vector": "with_positions_offsets",
  220. "analyzer": "ik_smart"
  221. },
  222. "PublishDate": {
  223. "type": "keyword"
  224. },
  225. "SubCategoryName": {
  226. "type": "text",
  227. "term_vector": "with_positions_offsets",
  228. "analyzer": "ik_smart"
  229. },
  230. "Title": {
  231. "type": "text",
  232. "term_vector": "with_positions_offsets",
  233. "analyzer": "ik_smart"
  234. },
  235. "TitleEn": {
  236. "type": "text",
  237. "term_vector": "with_positions_offsets"
  238. },
  239. "UpdateFrequency": {
  240. "type": "text",
  241. "term_vector": "with_positions_offsets"
  242. }
  243. }
  244. }
  245. }`
  246. EsCreateIndex(indexName, mappingJson)
  247. AddAllArticle()
  248. }
  249. func AddAllArticle() {
  250. endDate := time.Now().AddDate(0, 0, -30).Format(utils.FormatDate)
  251. //allList, err := models.GetArticleAll()
  252. allList, err := models.GetArticleAllDate(endDate)
  253. if err != nil {
  254. fmt.Println("GetArticleAll Err:", err.Error())
  255. return
  256. }
  257. indexName := utils.IndexName
  258. for _, v := range allList {
  259. content := html.UnescapeString(v.Body)
  260. doc, err := goquery.NewDocumentFromReader(strings.NewReader(content))
  261. if err != nil {
  262. fmt.Println("create doc err:", err.Error())
  263. return
  264. }
  265. bodyText := doc.Text()
  266. item := new(ElasticTestArticleDetail)
  267. item.ArticleId = v.ArticleId
  268. item.Title = v.Title
  269. item.PublishDate = v.PublishDate
  270. item.BodyText = bodyText
  271. EsAddOrEditData(indexName, strconv.Itoa(v.ArticleId), item)
  272. fmt.Println(v.ArticleId)
  273. }
  274. }
  275. func AddAllArticleV4() {
  276. allList, err := models.GetArticleAll2()
  277. if err != nil {
  278. fmt.Println("GetArticleAll Err:", err.Error())
  279. return
  280. }
  281. indexName := "cygx_article_v4"
  282. for _, v := range allList {
  283. content := html.UnescapeString(v.Body)
  284. doc, err := goquery.NewDocumentFromReader(strings.NewReader(content))
  285. if err != nil {
  286. fmt.Println("create doc err:", err.Error())
  287. return
  288. }
  289. bodyText := doc.Text()
  290. item := new(ElasticTestArticleDetailV4)
  291. item.ArticleId = v.ArticleId
  292. item.Title = v.Title
  293. item.PublishDate = v.PublishDate
  294. item.BodyText = bodyText
  295. item.IsSummary = v.IsSummary
  296. item.IsReport = v.IsReport
  297. //if v.IsReport == 1 {
  298. // item.IsReport = true
  299. //}
  300. //if v.IsSummary == 1 {
  301. // item.IsSummary = true
  302. //}
  303. EsAddOrEditDataV4(indexName, strconv.Itoa(v.ArticleId), item)
  304. fmt.Println(v.ArticleId)
  305. }
  306. }
  307. // "term_vector": "with_positions_offsets"
  308. type ElasticArticleDetail struct {
  309. ArticleId int `description:"报告id"`
  310. Title string `description:"标题"`
  311. TitleEn string `description:"英文标题 "`
  312. UpdateFrequency string `description:"更新周期"`
  313. CreateDate string `description:"创建时间"`
  314. PublishDate string `description:"发布时间"`
  315. Abstract string `description:"摘要"`
  316. CategoryName string `description:"一级分类"`
  317. SubCategoryName string `description:"二级分类"`
  318. InterviewDate string `description:"访谈时间"`
  319. ExpertBackground string `description:"专家背景"`
  320. ExpertNumber string `description:"专家编号"`
  321. Department string `description:"作者"`
  322. ArticleIdMd5 string `description:"纪要id"`
  323. BodyText string `description:"内容"`
  324. }
  325. type ElasticTestArticleDetail struct {
  326. ArticleId int `description:"报告id"`
  327. Title string `description:"标题"`
  328. BodyText string `description:"内容"`
  329. PublishDate string `description:"发布时间"`
  330. }
  331. type ElasticTestArticleDetailV4 struct {
  332. ArticleId int `description:"报告id"`
  333. Title string `description:"标题"`
  334. BodyText string `description:"内容"`
  335. PublishDate string `description:"发布时间"`
  336. IsSummary int `description:"是否属于纪要库"`
  337. IsReport int `description:"是否属于报告"`
  338. }
  339. func GetAddpArticle() {
  340. list, err := models.GetReportList()
  341. for _, v := range list {
  342. var articleId int
  343. maxArticleIdArticleInfo, errMax := models.GetMaxArticleIdInfo()
  344. if errMax != nil {
  345. fmt.Println(errMax)
  346. return
  347. }
  348. articleId = maxArticleIdArticleInfo.ArticleId + 1
  349. item := new(models.CygxArticle)
  350. item.Title = v.Title
  351. item.ArticleId = articleId
  352. item.SellerAndMobile = v.Author
  353. item.PublishDate = v.PublishTime
  354. item.Abstract = v.Abstract
  355. item.Body = html.UnescapeString(v.Content)
  356. item.BodyText, _ = GetReportContentTextSub(v.Content)
  357. item.IsReport = 1
  358. item.Source = 1
  359. item.ArticleIdMd5 = utils.MD5(strconv.Itoa(articleId))
  360. item.Department = "弘则产品组"
  361. item.ArticleType = "lyjh"
  362. item.IsClass = 1
  363. item.CreateDate = v.CreateTime
  364. item.UpdateFrequency = "unknow"
  365. item.CategoryId = 100 // 100是路演精华对应ID
  366. item.SubCategoryName = "路演精华"
  367. item.HavePublish = 1
  368. item.PublishStatus = 1
  369. item.Periods = strconv.Itoa(v.Stage)
  370. item.VideoUrl = v.VideoUrl
  371. item.VideoName = v.VideoName
  372. item.VideoPlaySeconds = v.VideoPlaySeconds
  373. newId, _ := models.AddCygxArticles(item)
  374. fmt.Println(articleId)
  375. fmt.Println(newId)
  376. fmt.Println(item.ArticleIdMd5)
  377. }
  378. fmt.Println(err)
  379. fmt.Println(list)
  380. }