imap.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471
  1. package mail
  2. import (
  3. "errors"
  4. "eta/eta_email_analysis/global"
  5. "eta/eta_email_analysis/models/report"
  6. "eta/eta_email_analysis/utils"
  7. "fmt"
  8. "github.com/emersion/go-imap"
  9. "github.com/emersion/go-imap/client"
  10. "github.com/emersion/go-message"
  11. "github.com/emersion/go-message/mail"
  12. "github.com/h2non/filetype"
  13. "io"
  14. "log"
  15. "os"
  16. "path"
  17. "strings"
  18. "time"
  19. )
// MailMessage is the parsed form of a single e-mail as produced by
// readEveryMsg and delivered to consumers through ListenMail's channel.
type MailMessage struct {
	// Date is the value of the message's Date header.
	Date time.Time `description:"收件时间"`
	// Uid is the UID of the message inside its mailbox (copied from imap.Message.Uid).
	Uid uint32 `description:"该邮件在邮箱中的唯一id"`
	// FromAddress is the sender's e-mail address; when the From header contains
	// no "@" it holds the raw header value instead.
	FromAddress string `description:"发件人邮箱"`
	// From is the sender's display name; when the From header contains no "@"
	// it holds the raw header value instead.
	From string `description:"发件人名称"`
	// Title is the decoded Subject header.
	Title string `description:"邮件标题"`
	// Content is the message body: the HTML part(s) when present, otherwise the
	// plain-text part(s).
	Content string `description:"邮件主体正文"`
	// Folder is the mailbox (folder) the message was read from.
	Folder string `description:"所属文件夹"`
	// Resources maps the Content-ID of each embedded resource to the path of
	// the file it was saved to.
	Resources map[string]string `description:"正文内嵌资源"`
	// Attachment maps each attachment's file name to the path of the file it
	// was saved to.
	Attachment map[string]string `description:"附件资源"`
}
// IsHandleMessageIdMap marks messages that have already been handled. It is
// keyed by the message UID converted to int; readEveryMsg only tests for key
// presence, not for the stored value.
// NOTE(review): this is a plain package-level map with no locking visible in
// this part of the file — confirm it is never written concurrently with reads.
var IsHandleMessageIdMap = map[int]bool{}
  33. func ListenMail(mailAddress, folder, userName, password string, readBatchSize, fromEmailIndex int, mailMessageChan chan MailMessage, mailMessageDoneChan chan bool) (err error) { // 收件箱
  34. defer func() {
  35. // 处理结束
  36. mailMessageDoneChan <- true
  37. if err != nil {
  38. fmt.Println("err:", err.Error())
  39. }
  40. }()
  41. // 建立与 IMAP 服务器的连接
  42. c, err := client.DialTLS(mailAddress, nil)
  43. if err != nil {
  44. fmt.Printf("连接 IMAP 服务器失败: %+v \n", err)
  45. return
  46. }
  47. // 最后一定不要忘记退出登录
  48. defer func() {
  49. _ = c.Logout()
  50. }()
  51. // 登录
  52. if err = c.Login(userName, password); err != nil {
  53. fmt.Printf("邮箱[%s] 登录失败: %v \n", fmt.Sprintf("%s:%s", userName, mailAddress), err)
  54. return
  55. }
  56. // 列出当前邮箱中的文件夹
  57. mailboxes := make(chan *imap.MailboxInfo, 10)
  58. done := make(chan error, 1) // 记录错误的 chan
  59. go func() {
  60. done <- c.List("", "*", mailboxes)
  61. }()
  62. log.Println("-->当前邮箱的文件夹 Mailboxes:")
  63. var folderExists bool
  64. for m := range mailboxes {
  65. log.Println("* ", m.Name)
  66. if m.Name == folder {
  67. folderExists = true
  68. }
  69. }
  70. err = <-done
  71. if err != nil {
  72. global.LOG.Errorf("列出邮箱列表时,出现错误:%v \n", err)
  73. return
  74. }
  75. log.Println("-->列出邮箱列表完毕!")
  76. if !folderExists {
  77. err = errors.New(fmt.Sprintf("文件夹[%s] 不存在 \n", folder))
  78. return
  79. }
  80. message.CharsetReader = myCharsetReader
  81. // 选择指定的文件夹
  82. mbox, err := c.Select(folder, false)
  83. if err != nil {
  84. err = errors.New(fmt.Sprintf("选择邮件箱失败: %+v", err))
  85. return
  86. }
  87. //log.Printf("mbox %+v \n", mbox)
  88. log.Printf("当前文件夹[%s]中,总共有 %d 封邮件 \n", folder, mbox.Messages)
  89. if mbox.Messages == 0 {
  90. //log.Fatalf("当前文件夹[%s]中没有邮件", folder)
  91. return
  92. }
  93. // 创建一个序列集,用于批量读取邮件
  94. seqSet := new(imap.SeqSet)
  95. to := mbox.Messages // 此文件下的邮件总数
  96. //minIndex := uint32(5)
  97. //// 假设需要获取最后4封邮件时
  98. //if fromEmailIndex > 0 {
  99. // minIndex = uint32(fromEmailIndex)
  100. //} else {
  101. // var maxNum uint32
  102. // //该次监听获取的最大数量
  103. // maxNum = 20000
  104. // //获取开始的邮件编号
  105. // if to > maxNum {
  106. // minIndex = to - maxNum + 1
  107. // }
  108. //}
  109. //from = 310
  110. var isStopFor bool
  111. step := uint32(1)
  112. for i := to; i >= 1; {
  113. start := i - step + 1
  114. if start < 0 {
  115. start = 1
  116. }
  117. //fmt.Printf("当前剩余%d封邮件待处理\n", i-minIndex+1)
  118. seqSet.Clear()
  119. seqSet.AddRange(start, i) // 添加指定范围内的邮件编号
  120. // 获取整个消息正文
  121. // imap.FetchEnvelope:请求获取邮件的信封数据(例如发件人、收件人、主题等元数据)。
  122. // imap.FetchRFC822:请求获取完整的邮件内容,包括所有头部和正文。
  123. items := []imap.FetchItem{imap.FetchFlags, imap.FetchEnvelope, imap.FetchRFC822}
  124. // 获取邮件内容 Start
  125. messages := make(chan *imap.Message, readBatchSize) // 创建一个通道,用于接收邮件消息
  126. fetchDone := make(chan error, 1) // 创建一个通道,用于接收错误消息
  127. go func() {
  128. // Fetch方法用于从服务器获取邮件数据,这里请求了邮件的信封和完整内容
  129. fetchDone <- c.Fetch(seqSet, items, messages)
  130. }()
  131. err = <-fetchDone
  132. if err != nil {
  133. global.LOG.Errorf("获取邮件信息出现错误:%v \n", err)
  134. return
  135. }
  136. // 获取邮件内容 End
  137. //log.Println("开始读取邮件内容")
  138. for msg := range messages {
  139. // 如果需要终止,那么就不处理了
  140. if isStopFor {
  141. continue
  142. }
  143. emailMessage, isRead, tmpErr := readEveryMsg(msg, folder)
  144. if tmpErr != nil {
  145. // 移除本地文件
  146. {
  147. for _, v := range emailMessage.Attachment {
  148. os.Remove(v)
  149. }
  150. for _, v := range emailMessage.Resources {
  151. os.Remove(v)
  152. }
  153. }
  154. global.FILE_LOG.Errorf("读取邮件内容时出现错误:%v \n", tmpErr)
  155. continue
  156. }
  157. // 如果没有取到,那么就过滤
  158. if !isRead {
  159. continue
  160. }
  161. // 判断当前邮件id是否小于等于已经监听到的最小id,如果是,那么就不处理了
  162. if emailMessage.Uid <= uint32(fromEmailIndex) {
  163. isStopFor = true
  164. continue
  165. }
  166. // 如果取到了,那么写入待处理chan
  167. // 写入邮件处理chan
  168. mailMessageChan <- emailMessage
  169. }
  170. if isStopFor {
  171. // 已经找到了最小的邮件id,那么就退出循环了
  172. }
  173. //time.Sleep(time.Second * 5) // 休眠10秒
  174. i = i - step
  175. }
  176. log.Println("读取了所有邮件,完毕!")
  177. return
  178. }
  179. // document link: https://github.com/emersion/go-imap/wiki/Fetching-messages
  180. func readEveryMsg(msg *imap.Message, folder string) (emailMessage MailMessage, ok bool, err error) {
  181. ok = true
  182. defer func() {
  183. if err != nil {
  184. ok = false
  185. global.FILE_LOG.Errorf("邮件读取失败;Err:%s", err.Error())
  186. }
  187. }()
  188. message.CharsetReader = myCharsetReader
  189. emailMessage.Resources = make(map[string]string) // 内嵌资源
  190. emailMessage.Attachment = make(map[string]string) // 附件
  191. emailMessage.Uid = msg.Uid
  192. emailMessage.Folder = folder
  193. if IsHandleMessageIdMap != nil {
  194. if _, has := IsHandleMessageIdMap[int(emailMessage.Uid)]; has {
  195. fmt.Println("邮件已处理,邮件下标:", emailMessage.Uid)
  196. return
  197. }
  198. }
  199. htmlStr := ``
  200. textStr := ``
  201. //log.Printf("当前邮件的消息序列号 %+v \n", msg.SeqNum)
  202. //log.Println("-------------------------")
  203. // 获取邮件正文
  204. r := msg.GetBody(&imap.BodySectionName{})
  205. if r == nil {
  206. global.FILE_LOG.Info("服务器没有返回消息内容")
  207. }
  208. mr, err := mail.CreateReader(r)
  209. if err != nil {
  210. //log.Fatalf("邮件读取时出现错误: %v \n", err)
  211. err = errors.New(fmt.Sprintf("邮件读取时出现错误:%v \n", err))
  212. return
  213. }
  214. // 收件时间
  215. {
  216. date, err := mr.Header.Date()
  217. if err != nil {
  218. log.Println("收件时间 异常:", err.Error())
  219. }
  220. emailMessage.Date = date
  221. //log.Println("收件时间 Date:", date)
  222. }
  223. // 发件人
  224. {
  225. fromStr := mr.Header.Get("From")
  226. //fmt.Println(fromStr)
  227. // 处理无效地址的情况
  228. if !strings.Contains(fromStr, "@") {
  229. emailMessage.FromAddress = fromStr
  230. emailMessage.From = fromStr
  231. } else {
  232. from, tmpErr := mr.Header.AddressList("From")
  233. if tmpErr != nil {
  234. log.Println("发件人 异常:", err.Error())
  235. }
  236. if len(from) > 0 {
  237. emailMessage.FromAddress = from[0].Address
  238. emailMessage.From = from[0].Name
  239. //mailMessage.From = from[0].String()
  240. //log.Println("发件人 From:", from)
  241. }
  242. }
  243. }
  244. //if to, err := mr.Header.AddressList("To"); err == nil {
  245. // log.Println("收件人 To:", to)
  246. //}
  247. //log.Printf("抄送 Cc: %+v \n", msg.Envelope.Cc)
  248. // 邮件标题
  249. subject, err := mr.Header.Subject()
  250. if err != nil {
  251. log.Println("邮件主题 Subject ERR:", err)
  252. } else {
  253. //log.Println("邮件主题 Subject:", subject)
  254. }
  255. emailMessage.Title = subject
  256. // 过滤
  257. if isIgnore(emailMessage) {
  258. ok = false
  259. return
  260. }
  261. //fmt.Println("当前邮件Uid:", emailMessage.Uid)
  262. //ok = false
  263. //return
  264. for {
  265. p, tmpErr := mr.NextPart()
  266. if tmpErr == io.EOF {
  267. break
  268. } else if tmpErr != nil {
  269. global.FILE_LOG.Errorf("读取邮件内容时出现错误:%v \n", tmpErr)
  270. err = tmpErr
  271. return
  272. }
  273. bodyBytes, _ := io.ReadAll(p.Body)
  274. if err != nil {
  275. //log.Fatalf("读取邮件部分时出现错误:%v \n", err)
  276. err = errors.New(fmt.Sprintf("读取邮件部分时出现错误:%v \n", err))
  277. return
  278. }
  279. switch h := p.Header.(type) {
  280. case *mail.InlineHeader:
  281. // 这是消息的文本(可以是纯文本或 HTML)
  282. contentType := h.Get("Content-Type")
  283. //log.Println("消息内容content-type:", contentType)
  284. if strings.HasPrefix(contentType, "text/plain") {
  285. //log.Printf("得到正文 -> TEXT: %v \n", string(bodyBytes))
  286. textStr += string(bodyBytes)
  287. } else if strings.HasPrefix(contentType, "text/html") {
  288. //log.Printf("得到正文 -> HTML: %v \n", len(b))
  289. //log.Printf("得到正文 -> HTML: %v \n", string(bodyBytes))
  290. htmlStr += string(bodyBytes)
  291. }
  292. // 这是内嵌资源
  293. if cid := p.Header.Get("Content-ID"); cid != "" {
  294. // 确定文件后缀
  295. fileSuffix := determineFileSuffix(bodyBytes)
  296. fileName := fmt.Sprintf("%s%s.%s", global.CONFIG.Serve.StaticDir, cid[1:len(cid)-1], fileSuffix)
  297. err = utils.SaveToFile(bodyBytes, fileName)
  298. if err != nil {
  299. //log.Fatalf("保存文件时出现错误:%v \n", err)
  300. err = errors.New(fmt.Sprintf("保存文件时出现错误:%v \n", err))
  301. return
  302. }
  303. emailMessage.Resources[cid] = fileName
  304. }
  305. break
  306. case *mail.AttachmentHeader:
  307. // 这是一个附件
  308. filename, _ := h.Filename()
  309. //log.Printf("得到附件: %v,content-type:%s \n", filename, p.Header.Get("Content-Type"))
  310. saveName := fmt.Sprint(msg.SeqNum, utils.MD5(filename), time.Now().Format(utils.FormatDateTimeUnSpace), time.Now().Nanosecond(), path.Ext(filename))
  311. filePath := fmt.Sprintf("%s%s%s%s", global.CONFIG.Serve.StaticDir, `file`, string(os.PathSeparator), saveName)
  312. err = utils.SaveToFile(bodyBytes, filePath)
  313. if err != nil {
  314. //log.Fatalf("保存文件时出现错误:%v \n", err)
  315. err = errors.New(fmt.Sprintf("保存文件时出现错误:%v \n", err))
  316. return
  317. }
  318. // 这是附件资源
  319. if contentDisposition := p.Header.Get("Content-Disposition"); contentDisposition != "" {
  320. if strings.HasPrefix(contentDisposition, "attachment") {
  321. emailMessage.Attachment[filename] = filePath
  322. }
  323. } else if cid := p.Header.Get("Content-ID"); cid != "" {
  324. // 这是内嵌资源
  325. emailMessage.Resources[cid] = filePath
  326. }
  327. //else {
  328. // mailMessage.Attachment[filename] = filePath
  329. //}
  330. break
  331. default:
  332. global.FILE_LOG.Info("未知格式:", h)
  333. //log.Println(h)
  334. }
  335. }
  336. emailMessage.Content = htmlStr
  337. if emailMessage.Content == `` {
  338. emailMessage.Content = textStr
  339. }
  340. //log.Println("一封邮件读取完毕")
  341. //log.Printf("------------------------- \n\n")
  342. return
  343. }
  344. // 根据文件内容确定文件后缀
  345. func determineFileSuffix(content []byte) string {
  346. kind, err := filetype.Match(content)
  347. if err != nil {
  348. global.FILE_LOG.Error("无法确定文件类型:%v \n", err)
  349. return ".bin"
  350. }
  351. return kind.Extension
  352. }
  353. // isIgnore
  354. // @Description: 校验是否忽略的邮件
  355. // @author: Roc
  356. // @datetime 2024-09-30 16:09:34
  357. // @param emailMessage MailMessage
  358. // @return bool
  359. func isIgnore(emailMessage MailMessage) bool {
  360. // 发件人中包含待过滤的字符串,那么就过滤
  361. lowerFrom := strings.ToLower(emailMessage.From)
  362. for _, email := range global.CONFIG.Email.IgnoreEmail {
  363. if utils.ContainsWholeWord(lowerFrom, email) {
  364. global.FILE_LOG.Infof("发件人包含%s,过滤掉,发件人:%s;标题:%s;所属下标:%d", email, emailMessage.From, emailMessage.Title, emailMessage.Uid)
  365. return true
  366. }
  367. }
  368. // 邮件标题中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  369. for _, email := range global.CONFIG.Email.IgnoreEmailCaseSensitive {
  370. if utils.ContainsWholeWord(emailMessage.From, email) {
  371. global.FILE_LOG.Infof("发件人包含%s,过滤掉,发件人:%s;标题:%s;所属下标:%d", email, emailMessage.From, emailMessage.Title, emailMessage.Uid)
  372. return true
  373. }
  374. }
  375. // 发件人地址中包含待过滤的字符串,那么就过滤
  376. lowerFromAddress := strings.ToLower(emailMessage.FromAddress)
  377. for _, emailAddress := range global.CONFIG.Email.IgnoreEmailAddress {
  378. if utils.ContainsWholeWord(lowerFromAddress, emailAddress) {
  379. global.FILE_LOG.Infof("发件人邮箱包含%s,过滤掉,发件人邮箱地址:%s;标题:%s;所属下标:%d", emailAddress, emailMessage.FromAddress, emailMessage.Title, emailMessage.Uid)
  380. return true
  381. }
  382. }
  383. // 邮件地址中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  384. for _, emailAddress := range global.CONFIG.Email.IgnoreEmailAddressCaseSensitive {
  385. if utils.ContainsWholeWord(emailMessage.FromAddress, emailAddress) {
  386. global.FILE_LOG.Infof("发件人邮箱包含%s,过滤掉,发件人邮箱地址:%s;标题:%s;所属下标:%d", emailAddress, emailMessage.FromAddress, emailMessage.Title, emailMessage.Uid)
  387. return true
  388. }
  389. }
  390. // 邮件标题中包含待过滤的字符串,那么就过滤
  391. lowerTitle := strings.ToLower(emailMessage.Title)
  392. for _, title := range global.CONFIG.Email.IgnoreEmailTitle {
  393. title = strings.ToLower(title)
  394. if utils.ContainsWholeWord(lowerTitle, title) {
  395. global.FILE_LOG.Infof("邮件标题包含%s,过滤掉,标题:%s,所属下标:%d", title, emailMessage.Title, emailMessage.Uid)
  396. return true
  397. }
  398. }
  399. // 邮件标题中包含待过滤的字符串(大小写敏感的标题),那么就过滤
  400. for _, title := range global.CONFIG.Email.IgnoreEmailTitleCaseSensitive {
  401. if utils.ContainsWholeWord(emailMessage.Title, title) {
  402. global.FILE_LOG.Infof("邮件标题包含%s,过滤掉,标题:%s,所属下标:%d", title, emailMessage.Title, emailMessage.Uid)
  403. return true
  404. }
  405. }
  406. return false
  407. }
  408. func RuleCheck(ruleList []report.MailRule, emailMessage MailMessage) bool {
  409. for _, v := range ruleList {
  410. title := strings.ToLower(emailMessage.Title)
  411. rule := strings.ToLower(v.Rule)
  412. if strings.Contains(title, rule) {
  413. return true
  414. }
  415. }
  416. return false
  417. }