imap.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460
  1. package mail
  2. import (
  3. "errors"
  4. "eta/eta_email_analysis/global"
  5. "eta/eta_email_analysis/models/report"
  6. "eta/eta_email_analysis/utils"
  7. "fmt"
  8. "github.com/emersion/go-imap"
  9. "github.com/emersion/go-imap/client"
  10. "github.com/emersion/go-message"
  11. "github.com/emersion/go-message/mail"
  12. "github.com/h2non/filetype"
  13. "io"
  14. "log"
  15. "os"
  16. "path"
  17. "strings"
  18. "time"
  19. )
  20. type MailMessage struct {
  21. Date time.Time `description:"收件时间"`
  22. Uid uint32 `description:"该邮件在邮箱中的唯一id"`
  23. FromAddress string `description:"发件人邮箱"`
  24. From string `description:"发件人名称"`
  25. Title string `description:"邮件标题"`
  26. Content string `description:"邮件主体正文"`
  27. Resources map[string]string `description:"正文内嵌资源"`
  28. Attachment map[string]string `description:"附件资源"`
  29. }
  30. func ListenMail(mailAddress, folder, userName, password string, readBatchSize, fromEmailIndex int, mailMessageChan chan MailMessage, mailMessageDoneChan chan bool) (err error) { // 收件箱
  31. defer func() {
  32. // 处理结束
  33. mailMessageDoneChan <- true
  34. if err != nil {
  35. fmt.Println("err:", err.Error())
  36. }
  37. }()
  38. // 建立与 IMAP 服务器的连接
  39. c, err := client.DialTLS(mailAddress, nil)
  40. if err != nil {
  41. fmt.Printf("连接 IMAP 服务器失败: %+v \n", err)
  42. return
  43. }
  44. // 最后一定不要忘记退出登录
  45. defer func() {
  46. _ = c.Logout()
  47. }()
  48. // 登录
  49. if err = c.Login(userName, password); err != nil {
  50. fmt.Printf("邮箱[%s] 登录失败: %v \n", fmt.Sprintf("%s:%s", userName, mailAddress), err)
  51. return
  52. }
  53. // 列出当前邮箱中的文件夹
  54. mailboxes := make(chan *imap.MailboxInfo, 10)
  55. done := make(chan error, 1) // 记录错误的 chan
  56. go func() {
  57. done <- c.List("", "*", mailboxes)
  58. }()
  59. log.Println("-->当前邮箱的文件夹 Mailboxes:")
  60. var folderExists bool
  61. for m := range mailboxes {
  62. log.Println("* ", m.Name)
  63. if m.Name == folder {
  64. folderExists = true
  65. }
  66. }
  67. err = <-done
  68. if err != nil {
  69. global.LOG.Errorf("列出邮箱列表时,出现错误:%v \n", err)
  70. return
  71. }
  72. log.Println("-->列出邮箱列表完毕!")
  73. if !folderExists {
  74. err = errors.New(fmt.Sprintf("文件夹[%s] 不存在 \n", folder))
  75. return
  76. }
  77. message.CharsetReader = myCharsetReader
  78. // 选择指定的文件夹
  79. mbox, err := c.Select(folder, false)
  80. if err != nil {
  81. err = errors.New(fmt.Sprintf("选择邮件箱失败: %+v", err))
  82. return
  83. }
  84. //log.Printf("mbox %+v \n", mbox)
  85. log.Printf("当前文件夹[%s]中,总共有 %d 封邮件 \n", folder, mbox.Messages)
  86. if mbox.Messages == 0 {
  87. //log.Fatalf("当前文件夹[%s]中没有邮件", folder)
  88. return
  89. }
  90. // 创建一个序列集,用于批量读取邮件
  91. seqSet := new(imap.SeqSet)
  92. to := mbox.Messages // 此文件下的邮件总数
  93. //minIndex := uint32(5)
  94. //// 假设需要获取最后4封邮件时
  95. //if fromEmailIndex > 0 {
  96. // minIndex = uint32(fromEmailIndex)
  97. //} else {
  98. // var maxNum uint32
  99. // //该次监听获取的最大数量
  100. // maxNum = 20000
  101. // //获取开始的邮件编号
  102. // if to > maxNum {
  103. // minIndex = to - maxNum + 1
  104. // }
  105. //}
  106. //from = 310
  107. var isStopFor bool
  108. step := uint32(1)
  109. for i := to; i >= 1; {
  110. start := i - step + 1
  111. if start < 0 {
  112. start = 1
  113. }
  114. //fmt.Printf("当前剩余%d封邮件待处理\n", i-minIndex+1)
  115. seqSet.Clear()
  116. seqSet.AddRange(start, i) // 添加指定范围内的邮件编号
  117. // 获取整个消息正文
  118. // imap.FetchEnvelope:请求获取邮件的信封数据(例如发件人、收件人、主题等元数据)。
  119. // imap.FetchRFC822:请求获取完整的邮件内容,包括所有头部和正文。
  120. items := []imap.FetchItem{imap.FetchFlags, imap.FetchEnvelope, imap.FetchRFC822}
  121. // 获取邮件内容 Start
  122. messages := make(chan *imap.Message, readBatchSize) // 创建一个通道,用于接收邮件消息
  123. fetchDone := make(chan error, 1) // 创建一个通道,用于接收错误消息
  124. go func() {
  125. // Fetch方法用于从服务器获取邮件数据,这里请求了邮件的信封和完整内容
  126. fetchDone <- c.Fetch(seqSet, items, messages)
  127. }()
  128. err = <-fetchDone
  129. if err != nil {
  130. global.LOG.Errorf("获取邮件信息出现错误:%v \n", err)
  131. return
  132. }
  133. // 获取邮件内容 End
  134. //log.Println("开始读取邮件内容")
  135. for msg := range messages {
  136. // 如果需要终止,那么就不处理了
  137. if isStopFor {
  138. continue
  139. }
  140. emailMessage, isRead, tmpErr := readEveryMsg(msg)
  141. if tmpErr != nil {
  142. // 移除本地文件
  143. {
  144. for _, v := range emailMessage.Attachment {
  145. os.Remove(v)
  146. }
  147. for _, v := range emailMessage.Resources {
  148. os.Remove(v)
  149. }
  150. }
  151. global.FILE_LOG.Errorf("读取邮件内容时出现错误:%v \n", tmpErr)
  152. continue
  153. }
  154. // 如果没有取到,那么就过滤
  155. if !isRead {
  156. continue
  157. }
  158. // 判断当前邮件id是否小于等于已经监听到的最小id,如果是,那么就不处理了
  159. if emailMessage.Uid <= uint32(fromEmailIndex) {
  160. isStopFor = true
  161. continue
  162. }
  163. // 如果取到了,那么写入待处理chan
  164. // 写入邮件处理chan
  165. mailMessageChan <- emailMessage
  166. }
  167. if isStopFor {
  168. // 已经找到了最小的邮件id,那么就退出循环了
  169. }
  170. //time.Sleep(time.Second * 5) // 休眠10秒
  171. i = i - step
  172. }
  173. log.Println("读取了所有邮件,完毕!")
  174. return
  175. }
  176. // document link: https://github.com/emersion/go-imap/wiki/Fetching-messages
  177. func readEveryMsg(msg *imap.Message) (emailMessage MailMessage, ok bool, err error) {
  178. ok = true
  179. defer func() {
  180. if err != nil {
  181. ok = false
  182. global.FILE_LOG.Errorf("邮件读取失败;Err:%s", err.Error())
  183. }
  184. }()
  185. message.CharsetReader = myCharsetReader
  186. emailMessage.Resources = make(map[string]string) // 内嵌资源
  187. emailMessage.Attachment = make(map[string]string) // 附件
  188. emailMessage.Uid = msg.Uid
  189. htmlStr := ``
  190. textStr := ``
  191. //log.Printf("当前邮件的消息序列号 %+v \n", msg.SeqNum)
  192. //log.Println("-------------------------")
  193. // 获取邮件正文
  194. r := msg.GetBody(&imap.BodySectionName{})
  195. if r == nil {
  196. global.FILE_LOG.Info("服务器没有返回消息内容")
  197. }
  198. mr, err := mail.CreateReader(r)
  199. if err != nil {
  200. //log.Fatalf("邮件读取时出现错误: %v \n", err)
  201. err = errors.New(fmt.Sprintf("邮件读取时出现错误:%v \n", err))
  202. return
  203. }
  204. // 收件时间
  205. {
  206. date, err := mr.Header.Date()
  207. if err != nil {
  208. log.Println("收件时间 异常:", err.Error())
  209. }
  210. emailMessage.Date = date
  211. //log.Println("收件时间 Date:", date)
  212. }
  213. // 发件人
  214. {
  215. fromStr := mr.Header.Get("From")
  216. //fmt.Println(fromStr)
  217. // 处理无效地址的情况
  218. if !strings.Contains(fromStr, "@") {
  219. emailMessage.FromAddress = fromStr
  220. emailMessage.From = fromStr
  221. } else {
  222. from, tmpErr := mr.Header.AddressList("From")
  223. if tmpErr != nil {
  224. log.Println("发件人 异常:", err.Error())
  225. }
  226. if len(from) > 0 {
  227. emailMessage.FromAddress = from[0].Address
  228. emailMessage.From = from[0].Name
  229. //mailMessage.From = from[0].String()
  230. //log.Println("发件人 From:", from)
  231. }
  232. }
  233. }
  234. //if to, err := mr.Header.AddressList("To"); err == nil {
  235. // log.Println("收件人 To:", to)
  236. //}
  237. //log.Printf("抄送 Cc: %+v \n", msg.Envelope.Cc)
  238. // 邮件标题
  239. subject, err := mr.Header.Subject()
  240. if err != nil {
  241. log.Println("邮件主题 Subject ERR:", err)
  242. } else {
  243. //log.Println("邮件主题 Subject:", subject)
  244. }
  245. emailMessage.Title = subject
  246. // 过滤
  247. if isIgnore(emailMessage) {
  248. ok = false
  249. return
  250. }
  251. //fmt.Println("当前邮件Uid:", emailMessage.Uid)
  252. //ok = false
  253. //return
  254. for {
  255. p, tmpErr := mr.NextPart()
  256. if tmpErr == io.EOF {
  257. break
  258. } else if tmpErr != nil {
  259. global.FILE_LOG.Errorf("读取邮件内容时出现错误:%v \n", tmpErr)
  260. err = tmpErr
  261. return
  262. }
  263. bodyBytes, _ := io.ReadAll(p.Body)
  264. if err != nil {
  265. //log.Fatalf("读取邮件部分时出现错误:%v \n", err)
  266. err = errors.New(fmt.Sprintf("读取邮件部分时出现错误:%v \n", err))
  267. return
  268. }
  269. switch h := p.Header.(type) {
  270. case *mail.InlineHeader:
  271. // 这是消息的文本(可以是纯文本或 HTML)
  272. contentType := h.Get("Content-Type")
  273. //log.Println("消息内容content-type:", contentType)
  274. if strings.HasPrefix(contentType, "text/plain") {
  275. //log.Printf("得到正文 -> TEXT: %v \n", string(bodyBytes))
  276. textStr += string(bodyBytes)
  277. } else if strings.HasPrefix(contentType, "text/html") {
  278. //log.Printf("得到正文 -> HTML: %v \n", len(b))
  279. //log.Printf("得到正文 -> HTML: %v \n", string(bodyBytes))
  280. htmlStr += string(bodyBytes)
  281. }
  282. // 这是内嵌资源
  283. if cid := p.Header.Get("Content-ID"); cid != "" {
  284. // 确定文件后缀
  285. fileSuffix := determineFileSuffix(bodyBytes)
  286. fileName := fmt.Sprintf("%s%s.%s", global.CONFIG.Serve.StaticDir, cid[1:len(cid)-1], fileSuffix)
  287. err = utils.SaveToFile(bodyBytes, fileName)
  288. if err != nil {
  289. //log.Fatalf("保存文件时出现错误:%v \n", err)
  290. err = errors.New(fmt.Sprintf("保存文件时出现错误:%v \n", err))
  291. return
  292. }
  293. emailMessage.Resources[cid] = fileName
  294. }
  295. break
  296. case *mail.AttachmentHeader:
  297. // 这是一个附件
  298. filename, _ := h.Filename()
  299. //log.Printf("得到附件: %v,content-type:%s \n", filename, p.Header.Get("Content-Type"))
  300. saveName := fmt.Sprint(msg.SeqNum, utils.MD5(filename), time.Now().Format(utils.FormatDateTimeUnSpace), time.Now().Nanosecond(), path.Ext(filename))
  301. filePath := fmt.Sprintf("%s%s%s%s", global.CONFIG.Serve.StaticDir, `file`, string(os.PathSeparator), saveName)
  302. err = utils.SaveToFile(bodyBytes, filePath)
  303. if err != nil {
  304. //log.Fatalf("保存文件时出现错误:%v \n", err)
  305. err = errors.New(fmt.Sprintf("保存文件时出现错误:%v \n", err))
  306. return
  307. }
  308. // 这是附件资源
  309. if contentDisposition := p.Header.Get("Content-Disposition"); contentDisposition != "" {
  310. if strings.HasPrefix(contentDisposition, "attachment") {
  311. emailMessage.Attachment[filename] = filePath
  312. }
  313. } else if cid := p.Header.Get("Content-ID"); cid != "" {
  314. // 这是内嵌资源
  315. emailMessage.Resources[cid] = filePath
  316. }
  317. //else {
  318. // mailMessage.Attachment[filename] = filePath
  319. //}
  320. break
  321. default:
  322. global.FILE_LOG.Info("未知格式:", h)
  323. //log.Println(h)
  324. }
  325. }
  326. emailMessage.Content = htmlStr
  327. if emailMessage.Content == `` {
  328. emailMessage.Content = textStr
  329. }
  330. //log.Println("一封邮件读取完毕")
  331. //log.Printf("------------------------- \n\n")
  332. return
  333. }
  334. // 根据文件内容确定文件后缀
  335. func determineFileSuffix(content []byte) string {
  336. kind, err := filetype.Match(content)
  337. if err != nil {
  338. global.FILE_LOG.Error("无法确定文件类型:%v \n", err)
  339. return ".bin"
  340. }
  341. return kind.Extension
  342. }
  343. // isIgnore
  344. // @Description: 校验是否忽略的邮件
  345. // @author: Roc
  346. // @datetime 2024-09-30 16:09:34
  347. // @param emailMessage MailMessage
  348. // @return bool
  349. func isIgnore(emailMessage MailMessage) bool {
  350. // 发件人中包含待过滤的字符串,那么就过滤
  351. lowerFrom := strings.ToLower(emailMessage.From)
  352. for _, email := range global.CONFIG.Email.IgnoreEmail {
  353. if utils.ContainsWholeWord(lowerFrom, email) {
  354. global.FILE_LOG.Infof("发件人包含%s,过滤掉,发件人:%s;标题:%s;所属下标:%d", email, emailMessage.From, emailMessage.Title, emailMessage.Uid)
  355. return true
  356. }
  357. }
  358. // 邮件标题中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  359. for _, email := range global.CONFIG.Email.IgnoreEmailCaseSensitive {
  360. if utils.ContainsWholeWord(emailMessage.From, email) {
  361. global.FILE_LOG.Infof("发件人包含%s,过滤掉,发件人:%s;标题:%s;所属下标:%d", email, emailMessage.From, emailMessage.Title, emailMessage.Uid)
  362. return true
  363. }
  364. }
  365. // 发件人地址中包含待过滤的字符串,那么就过滤
  366. lowerFromAddress := strings.ToLower(emailMessage.FromAddress)
  367. for _, emailAddress := range global.CONFIG.Email.IgnoreEmailAddress {
  368. if utils.ContainsWholeWord(lowerFromAddress, emailAddress) {
  369. global.FILE_LOG.Infof("发件人邮箱包含%s,过滤掉,发件人邮箱地址:%s;标题:%s;所属下标:%d", emailAddress, emailMessage.FromAddress, emailMessage.Title, emailMessage.Uid)
  370. return true
  371. }
  372. }
  373. // 邮件地址中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  374. for _, emailAddress := range global.CONFIG.Email.IgnoreEmailAddressCaseSensitive {
  375. if utils.ContainsWholeWord(emailMessage.FromAddress, emailAddress) {
  376. global.FILE_LOG.Infof("发件人邮箱包含%s,过滤掉,发件人邮箱地址:%s;标题:%s;所属下标:%d", emailAddress, emailMessage.FromAddress, emailMessage.Title, emailMessage.Uid)
  377. return true
  378. }
  379. }
  380. // 邮件标题中包含待过滤的字符串,那么就过滤
  381. lowerTitle := strings.ToLower(emailMessage.Title)
  382. for _, title := range global.CONFIG.Email.IgnoreEmailTitle {
  383. title = strings.ToLower(title)
  384. if utils.ContainsWholeWord(lowerTitle, title) {
  385. global.FILE_LOG.Infof("邮件标题包含%s,过滤掉,标题:%s,所属下标:%d", title, emailMessage.Title, emailMessage.Uid)
  386. return true
  387. }
  388. }
  389. // 邮件标题中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  390. for _, title := range global.CONFIG.Email.IgnoreEmailTitleCaseSensitive {
  391. if utils.ContainsWholeWord(emailMessage.Title, title) {
  392. global.FILE_LOG.Infof("邮件标题包含%s,过滤掉,标题:%s,所属下标:%d", title, emailMessage.Title, emailMessage.Uid)
  393. return true
  394. }
  395. }
  396. return false
  397. }
  398. func RuleCheck(ruleList []report.MailRule, emailMessage MailMessage) bool {
  399. for _, v := range ruleList {
  400. title := strings.ToLower(emailMessage.Title)
  401. rule := strings.ToLower(v.Rule)
  402. if strings.Contains(title, rule){
  403. return true
  404. }
  405. }
  406. return false
  407. }