12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849 |
- package services
- import (
- "fmt"
- "github.com/PuerkitoBio/goquery"
- "hongze/hongze_task/models"
- "hongze/hongze_task/utils"
- "html"
- "strings"
- )
- func FixReportContentSub() {
- items, err := models.GetReport()
- if err != nil {
- fmt.Println("err:", err.Error())
- return
- }
- for k, v := range items {
- fmt.Println(k, v.Id,v.ContentSub)
- content := html.UnescapeString(v.Content)
- utils.FileLog.Info("%s", content)
- doc, err := goquery.NewDocumentFromReader(strings.NewReader(content))
- if err != nil {
- fmt.Println("create doc err:", err.Error())
- return
- }
- n := 0
- contentSub := ""
- doc.Find("p").Each(func(i int, s *goquery.Selection) {
- if n >= 5 {
- return
- }
- n++
- phtml, err := s.Html()
- if err!=nil {
- fmt.Println("get html err",err.Error())
- return
- }
- if s.Text() != "" || strings.Contains(phtml, "src") {
- contentSub = contentSub + "<p>" + phtml + "</p>"
- utils.FileLog.Info("i:%d n:%d %s", i, n, contentSub)
- }
- })
- err = models.ModifyReportContentSub(v.Id, contentSub)
- if err != nil {
- fmt.Println("ModifyReportContentSub Err:" + err.Error())
- }
- }
- }
|