EmailParseService.java 45 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931
  1. package com.smppw.modaq.domain.service;
  2. import cn.hutool.core.collection.CollUtil;
  3. import cn.hutool.core.collection.ListUtil;
  4. import cn.hutool.core.date.DateUtil;
  5. import cn.hutool.core.exceptions.ExceptionUtil;
  6. import cn.hutool.core.io.FileUtil;
  7. import cn.hutool.core.map.MapUtil;
  8. import cn.hutool.core.util.StrUtil;
  9. import com.smppw.modaq.application.components.OCRReportParser;
  10. import com.smppw.modaq.application.components.ReportParseUtils;
  11. import com.smppw.modaq.application.components.report.parser.ReportParser;
  12. import com.smppw.modaq.application.components.report.parser.ReportParserFactory;
  13. import com.smppw.modaq.application.components.report.writer.ReportWriter;
  14. import com.smppw.modaq.application.components.report.writer.ReportWriterFactory;
  15. import com.smppw.modaq.application.util.EmailUtil;
  16. import com.smppw.modaq.common.conts.DateConst;
  17. import com.smppw.modaq.common.conts.EmailParseStatusConst;
  18. import com.smppw.modaq.common.conts.EmailTypeConst;
  19. import com.smppw.modaq.common.enums.ReportParseStatus;
  20. import com.smppw.modaq.common.enums.ReportParserFileType;
  21. import com.smppw.modaq.common.enums.ReportType;
  22. import com.smppw.modaq.common.exception.NotSupportReportException;
  23. import com.smppw.modaq.common.exception.ReportParseException;
  24. import com.smppw.modaq.domain.dto.EmailContentInfoDTO;
  25. import com.smppw.modaq.domain.dto.EmailZipFileDTO;
  26. import com.smppw.modaq.domain.dto.MailboxInfoDTO;
  27. import com.smppw.modaq.domain.dto.report.OCRParseData;
  28. import com.smppw.modaq.domain.dto.report.ParseResult;
  29. import com.smppw.modaq.domain.dto.report.ReportData;
  30. import com.smppw.modaq.domain.dto.report.ReportParserParams;
  31. import com.smppw.modaq.domain.entity.EmailFileInfoDO;
  32. import com.smppw.modaq.domain.entity.EmailParseInfoDO;
  33. import com.smppw.modaq.domain.mapper.EmailFileInfoMapper;
  34. import com.smppw.modaq.domain.mapper.EmailParseInfoMapper;
  35. import com.smppw.modaq.infrastructure.util.ArchiveUtil;
  36. import com.smppw.modaq.infrastructure.util.PdfUtil;
  37. import jakarta.mail.*;
  38. import jakarta.mail.internet.MimeUtility;
  39. import jakarta.mail.search.ComparisonTerm;
  40. import jakarta.mail.search.ReceivedDateTerm;
  41. import jakarta.mail.search.SearchTerm;
  42. import org.slf4j.Logger;
  43. import org.slf4j.LoggerFactory;
  44. import org.springframework.beans.factory.annotation.Value;
  45. import org.springframework.stereotype.Service;
  46. import org.springframework.util.StopWatch;
  47. import java.io.File;
  48. import java.io.IOException;
  49. import java.io.InputStream;
  50. import java.nio.file.Files;
  51. import java.nio.file.Path;
  52. import java.nio.file.Paths;
  53. import java.util.*;
  54. import java.util.regex.Matcher;
  55. import java.util.regex.Pattern;
  56. import java.util.stream.Collectors;
  57. /**
  58. * @author mozuwen
  59. * @date 2024-09-04
  60. * @description 邮件解析服务
  61. */
  62. @Service
  63. public class EmailParseService {
  64. // public static final int stepSize = 10000;
  65. private static final Logger log = LoggerFactory.getLogger(EmailParseService.class);
  66. // 扩展支持的 MIME 类型
  67. private static final Set<String> attachmentMimePrefixes = Set.of(
  68. "application/pdf",
  69. "application/zip",
  70. "application/x-zip-compressed",
  71. "application/rar",
  72. "application/x-rar-compressed"
  73. // 按需添加其他类型...
  74. );
  75. // private final EmailFieldMappingMapper emailFieldMapper;
  76. private final EmailParseInfoMapper emailParseInfoMapper;
  77. private final EmailFileInfoMapper emailFileInfoMapper;
  78. /* 报告解析和入库的方法 */
  79. private final ReportParserFactory reportParserFactory;
  80. private final ReportWriterFactory reportWriterFactory;
  81. @Value("${email.file.path}")
  82. private String path;
  83. @Value("${email.report.ocr-parser-url}")
  84. private String ocrParserUrl;
  85. @Value("${email.read-write-seen:true}")
  86. private boolean readWriteSeen;
  87. public EmailParseService(EmailParseInfoMapper emailParseInfoMapper,
  88. EmailFileInfoMapper emailFileInfoMapper,
  89. ReportParserFactory reportParserFactory,
  90. ReportWriterFactory reportWriterFactory) {
  91. this.emailParseInfoMapper = emailParseInfoMapper;
  92. this.emailFileInfoMapper = emailFileInfoMapper;
  93. this.reportParserFactory = reportParserFactory;
  94. this.reportWriterFactory = reportWriterFactory;
  95. }
  96. /**
  97. * 解析指定邮箱指定时间范围内的邮件
  98. *
  99. * @param mailboxInfoDTO 邮箱配置信息
  100. * @param startDate 邮件起始日期(yyyy-MM-dd HH:mm:ss)
  101. * @param endDate 邮件截止日期(yyyy-MM-dd HH:mm:ss, 为null,将解析邮件日期小于等于startDate的当天邮件)
  102. * @param emailTypes 当前任务支持的邮件类型,默认支持确认单
  103. */
  104. public void parseEmail(MailboxInfoDTO mailboxInfoDTO,
  105. Date startDate, Date endDate,
  106. List<String> folderNames, List<Integer> emailTypes) {
  107. if (CollUtil.isEmpty(emailTypes)) {
  108. emailTypes = ListUtil.of(EmailTypeConst.REPORT_LETTER_EMAIL_TYPE);
  109. }
  110. if (log.isInfoEnabled()) {
  111. log.info("开始邮件解析 -> 邮箱信息:{},开始时间:{},结束时间:{}", mailboxInfoDTO, DateUtil.format(startDate,
  112. DateConst.YYYY_MM_DD_HH_MM_SS), DateUtil.format(endDate, DateConst.YYYY_MM_DD_HH_MM_SS));
  113. }
  114. Map<String, List<EmailContentInfoDTO>> emailContentMap;
  115. try {
  116. emailContentMap = this.realEmail(mailboxInfoDTO, startDate, endDate, folderNames);
  117. } catch (Exception e) {
  118. log.error("采集邮件失败 -> 邮箱配置信息:{},堆栈信息:{}", mailboxInfoDTO, ExceptionUtil.stacktraceToString(e));
  119. return;
  120. }
  121. if (MapUtil.isEmpty(emailContentMap)) {
  122. log.warn("未采集到邮件 -> 邮箱配置信息:{},开始时间:{},结束时间:{}", mailboxInfoDTO,
  123. DateUtil.format(startDate, DateConst.YYYY_MM_DD_HH_MM_SS), DateUtil.format(endDate, DateConst.YYYY_MM_DD_HH_MM_SS));
  124. return;
  125. }
  126. for (Map.Entry<String, List<EmailContentInfoDTO>> emailEntry : emailContentMap.entrySet()) {
  127. List<EmailContentInfoDTO> emailContentInfoDTOList = emailEntry.getValue();
  128. if (CollUtil.isEmpty(emailContentInfoDTOList)) {
  129. log.warn("未采集到正文或附件");
  130. continue;
  131. }
  132. log.info("开始解析邮件数据 -> 邮件主题:{},邮件日期:{}", emailContentInfoDTOList.get(0).getEmailTitle(), emailContentInfoDTOList.get(0).getEmailDate());
  133. Map<EmailContentInfoDTO, List<EmailZipFileDTO>> emailZipFileMap = MapUtil.newHashMap();
  134. for (EmailContentInfoDTO emailContentInfoDTO : emailContentInfoDTOList) {
  135. // 正文不用解压附件
  136. if (emailContentInfoDTO.getFileName() != null && emailContentInfoDTO.getFileName().endsWith(".html")) {
  137. emailZipFileMap.put(emailContentInfoDTO, ListUtil.list(false));
  138. continue;
  139. }
  140. try {
  141. List<EmailZipFileDTO> tempList = emailZipFileMap.getOrDefault(emailContentInfoDTO, ListUtil.list(false));
  142. tempList.addAll(this.parseZipEmail(emailContentInfoDTO));
  143. emailZipFileMap.put(emailContentInfoDTO, tempList);
  144. } catch (IOException e) {
  145. log.error("压缩包解压失败:{}", ExceptionUtil.stacktraceToString(e));
  146. EmailParseInfoDO fail = buildEmailParseInfo(null, mailboxInfoDTO.getAccount(), emailContentInfoDTO);
  147. fail.setFailReason("压缩包解压失败");
  148. fail.setParseStatus(EmailParseStatusConst.FAIL);
  149. fail.setEmailKey(emailEntry.getKey());
  150. this.emailParseInfoMapper.insert(fail);
  151. } catch (Exception e) {
  152. log.error("堆栈信息:{}", ExceptionUtil.stacktraceToString(e));
  153. }
  154. }
  155. Iterator<Map.Entry<EmailContentInfoDTO, List<EmailZipFileDTO>>> entryIterator = emailZipFileMap.entrySet().iterator();
  156. while (entryIterator.hasNext()) {
  157. Map.Entry<EmailContentInfoDTO, List<EmailZipFileDTO>> entry = entryIterator.next();
  158. EmailContentInfoDTO key = entry.getKey();
  159. List<EmailZipFileDTO> dtos = entry.getValue();
  160. List<Integer> types = ListUtil.list(false);
  161. types.add(key.getEmailType());
  162. if (CollUtil.isNotEmpty(dtos)) {
  163. List<Integer> list = dtos.stream().map(EmailZipFileDTO::getEmailType).distinct().toList();
  164. CollUtil.addAllIfNotContains(types, list);
  165. }
  166. boolean flag = false;
  167. for (Integer type : types) {
  168. if (emailTypes.contains(type)) {
  169. flag = true;
  170. break;
  171. }
  172. }
  173. if (!flag) {
  174. log.warn("当前邮件{} 的类型{} 不在支持的任务类型{} 中,不用执行解析逻辑。", key, types, emailTypes);
  175. entryIterator.remove();
  176. }
  177. }
  178. // 保存相关信息 -> 邮件信息表,邮件文件表,邮件净值表,邮件规模表,基金净值表
  179. saveRelatedTable(emailEntry.getKey(), mailboxInfoDTO.getAccount(), emailZipFileMap);
  180. log.info("结束邮件解析 -> 邮箱信息:{},开始时间:{},结束时间:{}", emailEntry.getValue(),
  181. DateUtil.format(startDate, DateConst.YYYY_MM_DD_HH_MM_SS), DateUtil.format(endDate, DateConst.YYYY_MM_DD_HH_MM_SS));
  182. }
  183. }
  184. public List<EmailZipFileDTO> parseZipEmail(EmailContentInfoDTO emailContentInfoDTO) throws IOException {
  185. List<EmailZipFileDTO> resultList = ListUtil.list(false);
  186. Integer emailType = emailContentInfoDTO.getEmailType();
  187. String filepath = emailContentInfoDTO.getFilePath();
  188. String emailTitle = emailContentInfoDTO.getEmailTitle();
  189. int fileSize = emailContentInfoDTO.getFileSize();
  190. if (ArchiveUtil.isZip(filepath)) {
  191. handleCompressedFiles(emailTitle, filepath, ".zip", emailType, fileSize, resultList);
  192. } else if (ArchiveUtil.isRAR(filepath)) {
  193. handleCompressedFiles(emailTitle, filepath, ".rar", emailType, fileSize, resultList);
  194. } else {
  195. // 不是压缩包时
  196. EmailZipFileDTO dto = new EmailZipFileDTO(emailTitle, emailContentInfoDTO);
  197. resultList.add(dto);
  198. }
  199. // 文件中的类型判断
  200. if (emailType == null || !EmailTypeConst.SUPPORT_EMAIL_TYPES.contains(emailType)) {
  201. emailType = EmailUtil.getEmailTypeBySubject(emailContentInfoDTO.getFileName());
  202. emailContentInfoDTO.setEmailType(emailType);
  203. }
  204. if (CollUtil.isNotEmpty(resultList)) {
  205. for (EmailZipFileDTO dto : resultList) {
  206. dto.setEmailType(emailType);
  207. }
  208. if (log.isInfoEnabled()) {
  209. log.info("当前邮件{} 所有解压缩文件解压完成:{}", emailTitle, resultList);
  210. }
  211. }
  212. return resultList;
  213. }
  214. private void handleCompressedFiles(String emailTitle, String filepath, String extension,
  215. Integer emailType, int fileSize, List<EmailZipFileDTO> resultList) throws IOException {
  216. String destPath = getDestinationPath(filepath, extension);
  217. File destFile = new File(destPath);
  218. if (!destFile.exists()) {
  219. if (!destFile.mkdirs()) {
  220. throw new IOException("无法创建目标目录: " + destPath);
  221. }
  222. }
  223. List<String> extractedDirs;
  224. if (ArchiveUtil.isZip(filepath)) {
  225. extractedDirs = ArchiveUtil.extractCompressedFiles(filepath, destPath);
  226. } else if (ArchiveUtil.isRAR(filepath)) {
  227. extractedDirs = ArchiveUtil.extractRar5(filepath, destPath);
  228. } else {
  229. return;
  230. }
  231. for (String dir : extractedDirs) {
  232. // 如果邮件类型不满足解析条件则重新根据文件名判断
  233. if (emailType == null || !EmailTypeConst.SUPPORT_EMAIL_TYPES.contains(emailType)) {
  234. emailType = EmailUtil.getEmailTypeBySubject(dir);
  235. }
  236. File file = new File(dir);
  237. if (file.isDirectory()) {
  238. String[] subDirs = file.list();
  239. if (subDirs != null) {
  240. for (String subDir : subDirs) {
  241. resultList.add(new EmailZipFileDTO(emailTitle, subDir, fileSize, emailType));
  242. }
  243. } else {
  244. log.warn("目录 {} 下无文件", dir);
  245. }
  246. } else {
  247. resultList.add(new EmailZipFileDTO(emailTitle, dir, fileSize, emailType));
  248. }
  249. }
  250. }
  251. private String getDestinationPath(String filepath, String extension) {
  252. Path path = Paths.get(filepath);
  253. String fileName = path.getFileName().toString();
  254. String baseName = fileName.substring(0, fileName.length() - extension.length());
  255. return path.getParent().resolve(baseName).toString();
  256. }
  257. public void saveRelatedTable(String emailKey, String emailAddress,
  258. Map<EmailContentInfoDTO, List<EmailZipFileDTO>> emailZipFileMap) {
  259. // python 报告解析接口结果
  260. List<ParseResult<ReportData>> dataList = ListUtil.list(false);
  261. for (Map.Entry<EmailContentInfoDTO, List<EmailZipFileDTO>> entry : emailZipFileMap.entrySet()) {
  262. EmailContentInfoDTO emailDto = entry.getKey();
  263. if (emailDto.getFileName() != null && emailDto.getFileName().endsWith(".html")) {
  264. continue;
  265. }
  266. String emailTitle = emailDto.getEmailTitle();
  267. // 待解析文件数据处理,不支持已存在的文件重复解析
  268. List<EmailZipFileDTO> dtos = ListUtil.list(false);
  269. List<EmailZipFileDTO> zipFiles = entry.getValue();
  270. if (CollUtil.isEmpty(zipFiles)) {
  271. dtos.add(new EmailZipFileDTO(emailTitle, emailDto));
  272. } else {
  273. dtos.addAll(zipFiles);
  274. zipFiles.clear();
  275. }
  276. // 重新判断类型
  277. for (EmailZipFileDTO dto : dtos) {
  278. if (!EmailTypeConst.SUPPORT_NO_OTHER_TYPES.contains(dto.getEmailType())) {
  279. Integer emailType = EmailUtil.getEmailTypeBySubject(emailTitle + dto.getFilename());
  280. dto.setEmailType(emailType);
  281. }
  282. }
  283. // 如果压缩包里面既有pdf又有其他格式的文件,说明其他格式的文件是不需要解析的
  284. List<String> exts = dtos.stream().map(EmailZipFileDTO::getExtName).distinct().toList();
  285. if (exts.contains("pdf") && exts.size() > 1) {
  286. dtos.removeIf(e -> !Objects.equals("pdf", e.getExtName()));
  287. }
  288. // 数据库已存在的数据过滤(邮件主题+报告名称+附件大小)
  289. Iterator<EmailZipFileDTO> iterator = dtos.iterator();
  290. while (iterator.hasNext()) {
  291. EmailZipFileDTO dto = iterator.next();
  292. String filename = dto.getFilename();
  293. // 删除复核函或基金合同
  294. if (filename.contains("复核函") || (filename.contains("基金合同") && !filename.contains("合同变更"))) {
  295. log.warn("邮件{} 中的报告{} 是复核函或基金合同,不用解析上传。", emailTitle, filename);
  296. iterator.remove();
  297. }
  298. Integer emailType = dto.getEmailType();
  299. int fileSize = dto.getFileSize();
  300. int count = 0;
  301. if (Objects.equals(emailType, EmailTypeConst.REPORT_LETTER_EMAIL_TYPE)) {
  302. // 确认单
  303. count = this.emailFileInfoMapper.getLetterFilenameSuccessCount(emailTitle, filename);
  304. } else if (Objects.equals(emailType, EmailTypeConst.REPORT_EMAIL_TYPE)) {
  305. // 定期报告
  306. count = this.emailFileInfoMapper.getAmacFilenameSuccessCount(emailTitle, filename, fileSize);
  307. } else if (Objects.equals(emailType, EmailTypeConst.REPORT_WEEKLY_TYPE)) {
  308. // 管理人周报
  309. count = this.emailFileInfoMapper.getWeeklyFilenameSuccessCount(emailTitle, filename, fileSize);
  310. } else if (Objects.equals(emailType, EmailTypeConst.REPORT_OTHER_TYPE)) {
  311. // 其他报告
  312. count = this.emailFileInfoMapper.getOtherFilenameSuccessCount(emailTitle, filename, fileSize);
  313. } else {
  314. log.info("邮件{} 类型{} 不支持解析。", emailTitle, emailType);
  315. iterator.remove();
  316. }
  317. if (count > 0) {
  318. iterator.remove();
  319. log.info("邮件{} 报告{} 已存在解析成功的记录,不用重新解析。", emailTitle, filename);
  320. }
  321. }
  322. if (CollUtil.isEmpty(dtos)) {
  323. log.info("邮件{} 所有文件都已经解析成功过,不能重复解析了", emailTitle);
  324. continue;
  325. }
  326. if (log.isInfoEnabled()) {
  327. log.info("邮件{} 还有报告待解析:{}", emailTitle, dtos);
  328. }
  329. Integer emailId = emailDto.getEmailId();
  330. EmailParseInfoDO emailParseInfoDO = this.buildEmailParseInfo(emailId, emailAddress, emailDto);
  331. emailParseInfoDO.setEmailKey(emailKey);
  332. emailId = this.saveEmailParseInfo(emailParseInfoDO);
  333. if (emailId == null) {
  334. continue;
  335. }
  336. for (EmailZipFileDTO zipFile : dtos) {
  337. EmailFileInfoDO emailFile = this.saveEmailFileInfo(emailId, zipFile.getFilename(), zipFile.getFilepath());
  338. // 解析并保存报告
  339. ParseResult<ReportData> parseResult = this.parseReportAndHandleResult(emailTitle, emailFile, zipFile);
  340. dataList.add(parseResult);
  341. }
  342. String failReason = null;
  343. int emailParseStatus = EmailParseStatusConst.SUCCESS;
  344. // 报告邮件有一条失败就表示整个邮件解析失败
  345. if (CollUtil.isNotEmpty(dataList)) {
  346. // ai解析结果
  347. List<ReportData> aiParaseList = dataList.stream().map(ParseResult::getData)
  348. .filter(Objects::nonNull).filter(e -> Objects.equals(true, e.getAiParse())).toList();
  349. if (CollUtil.isNotEmpty(aiParaseList)) {
  350. for (ReportData data : aiParaseList) {
  351. this.emailFileInfoMapper.updateAiParseByFileId(data.getBaseInfo().getFileId(), data.getAiParse(), data.getAiFileId());
  352. }
  353. }
  354. long failNum = dataList.stream().filter(e -> !Objects.equals(EmailParseStatusConst.SUCCESS, e.getStatus())).count();
  355. if (failNum > 0) {
  356. emailParseStatus = EmailParseStatusConst.FAIL;
  357. failReason = dataList.stream().map(ParseResult::getMsg).collect(Collectors.joining(";"));
  358. }
  359. }
  360. emailParseInfoMapper.updateParseStatus(emailId, emailParseStatus, failReason);
  361. }
  362. }
  363. private ParseResult<ReportData> parseReportAndHandleResult(String emailTitle, EmailFileInfoDO emailFileInfo, EmailZipFileDTO zipFile) {
  364. Integer emailType = zipFile.getEmailType();
  365. String fileName = zipFile.getFilename();
  366. String filepath = zipFile.getFilepath();
  367. ParseResult<ReportData> result = new ParseResult<>();
  368. boolean reportFlag = emailType == null || !EmailTypeConst.SUPPORT_EMAIL_TYPES.contains(emailType);
  369. if (reportFlag || StrUtil.isBlank(fileName) || fileName.endsWith(".html")) {
  370. result.setStatus(ReportParseStatus.NOT_A_REPORT.getCode());
  371. result.setMsg(StrUtil.format(ReportParseStatus.NOT_A_REPORT.getMsg(), fileName));
  372. log.error(result.getMsg());
  373. return result;
  374. }
  375. // 类型识别---先识别季度报告,没有季度再识别年度报告,最后识别月报
  376. ReportType reportType = ReportParseUtils.matchReportType(emailType, fileName);
  377. if (reportType == null) {
  378. reportType = ReportParseUtils.matchReportType(emailType, emailTitle);
  379. if (log.isDebugEnabled()) {
  380. log.debug("报告{} 根据邮件主题{} 重新识别的类型是:{}", fileName, emailTitle, reportType);
  381. }
  382. }
  383. // 解析器--根据文件后缀获取对应解析器,解析不了就用AI来解析
  384. ReportParserFileType fileType;
  385. String fileSuffix = StrUtil.subAfter(fileName, ".", true);
  386. fileType = ReportParserFileType.getBySuffix(fileSuffix);
  387. // 不支持的格式
  388. if (fileType == null) {
  389. result.setStatus(ReportParseStatus.NO_SUPPORT_TEMPLATE.getCode());
  390. result.setMsg(StrUtil.format(ReportParseStatus.NO_SUPPORT_TEMPLATE.getMsg(), fileName));
  391. log.error(result.getMsg());
  392. return result;
  393. }
  394. // 不是定期报告的判断逻辑放在不支持的格式下面
  395. if (reportType == null) {
  396. result.setStatus(ReportParseStatus.NOT_A_REPORT.getCode());
  397. result.setMsg(StrUtil.format(ReportParseStatus.NOT_A_REPORT.getMsg(), fileName));
  398. log.error(result.getMsg());
  399. return result;
  400. }
  401. Integer fileId = emailFileInfo.getId();
  402. // 首页和尾页转为png图片,首页用来识别基金名称和基金代码、尾页用来识别印章和联系人
  403. List<String> images = ListUtil.list(true);
  404. if (Objects.equals(ReportParserFileType.PDF, fileType)) {
  405. try {
  406. String output = FileUtil.getParent(filepath, 1) + File.separator + "image";
  407. images = PdfUtil.convertFirstAndLastPagesToPng(filepath, FileUtil.file(output), 300);
  408. if (log.isDebugEnabled()) {
  409. log.debug("报告[{}] 生成的图片地址是:{}", fileName, images);
  410. }
  411. } catch (Exception e) {
  412. log.warn("报告[{}] 生成图片失败:{}", fileName, ExceptionUtil.stacktraceToString(e));
  413. }
  414. } else if (Objects.equals(ReportParserFileType.IMG, fileType)) {
  415. try {
  416. String outputFile = PdfUtil.compressAndSave(filepath);
  417. images.add(outputFile);
  418. } catch (IOException e) {
  419. log.error("报告{} 图片压缩失败,{}", fileName, ExceptionUtil.stacktraceToString(e));
  420. }
  421. }
  422. // 不支持解析的格式文件
  423. boolean notSupportFile = false;
  424. // 解析报告
  425. ReportData reportData = null;
  426. ReportParserParams params = new ReportParserParams(fileId, fileName, filepath, reportType);
  427. StopWatch parserWatch = new StopWatch();
  428. parserWatch.start();
  429. try {
  430. if (reportType != ReportType.OTHER && reportType != ReportType.WEEKLY) {
  431. ReportParser<ReportData> instance = this.reportParserFactory.getInstance(reportType, fileType);
  432. reportData = instance.parse(params);
  433. result.setStatus(1);
  434. result.setMsg("报告解析成功");
  435. result.setData(reportData);
  436. } else {
  437. if (log.isInfoEnabled()) {
  438. log.info("报告{} 是周报或其他类型,直接用AI解析器解析", fileName);
  439. }
  440. }
  441. } catch (ReportParseException e) {
  442. log.error("解析失败:{}", StrUtil.format(e.getMsg(), fileName));
  443. result.setStatus(e.getCode());
  444. result.setMsg(StrUtil.format(e.getMsg(), fileName));
  445. if (e instanceof NotSupportReportException) {
  446. notSupportFile = true;
  447. }
  448. } catch (Exception e) {
  449. log.error("解析错误:{}", ExceptionUtil.stacktraceToString(e));
  450. result.setStatus(ReportParseStatus.PARSE_FAIL.getCode());
  451. result.setMsg(StrUtil.format(ReportParseStatus.PARSE_FAIL.getMsg(), e.getMessage()));
  452. } finally {
  453. // 如果解析结果是空的就用AI工具解析一次
  454. if (reportData == null && !notSupportFile) {
  455. if (reportType == ReportType.QUARTERLY || reportType == ReportType.ANNUALLY) {
  456. if (log.isInfoEnabled()) {
  457. log.info("报告{} 开始AI解析......", fileName);
  458. }
  459. } else if (CollUtil.isNotEmpty(images)) {
  460. filepath = images.get(0);
  461. if (log.isInfoEnabled()) {
  462. log.info("报告{} 用首页图片{} 开始AI解析......", fileName, filepath);
  463. }
  464. }
  465. try {
  466. params = new ReportParserParams(fileId, fileName, filepath, reportType);
  467. ReportParser<ReportData> instance = this.reportParserFactory.getInstance(reportType, ReportParserFileType.AI);
  468. reportData = instance.parse(params);
  469. result.setStatus(1);
  470. result.setMsg("报告解析成功--AI");
  471. result.setData(reportData);
  472. } catch (ReportParseException e) {
  473. log.error("AI解析失败:{}", StrUtil.format(e.getMsg(), fileName));
  474. result.setStatus(e.getCode());
  475. result.setMsg(StrUtil.format(e.getMsg(), fileName));
  476. } catch (Exception e) {
  477. log.error("AI解析错误:{}", ExceptionUtil.stacktraceToString(e));
  478. result.setStatus(ReportParseStatus.PARSE_FAIL.getCode());
  479. result.setMsg(StrUtil.format(ReportParseStatus.PARSE_FAIL.getMsg(), e.getMessage()));
  480. }
  481. if (log.isInfoEnabled()) {
  482. log.info("报告{} AI解析结束!", fileName);
  483. }
  484. }
  485. // ocr信息提取
  486. this.ocrReportData(reportType, reportData, fileName, images);
  487. parserWatch.stop();
  488. if (log.isInfoEnabled()) {
  489. log.info("报告{}解析结果为{},耗时{}ms", fileName, reportData, parserWatch.getTotalTimeMillis());
  490. }
  491. }
  492. // 保存报告解析结果
  493. this.saveReportData(reportData, reportType, fileName);
  494. return result;
  495. }
  496. /**
  497. * ocr 提取信息(包括首页的基金名称或报告日期,尾页的印章或联系人等信息)
  498. *
  499. * @param reportData 报告解析结果
  500. * @param fileName 报告名称
  501. * @param images 报告的收益和尾页png图片
  502. */
  503. private void ocrReportData(ReportType reportType, ReportData reportData, String fileName, List<String> images) {
  504. if (reportData == null || CollUtil.isEmpty(images)) {
  505. return;
  506. }
  507. OCRParseData parseRes = null;
  508. // 报告才识别尾页的印章和联系人,确认单不识别尾页
  509. if (ReportType.LETTER != reportType) {
  510. try {
  511. // 首页和尾页相等时只读首页
  512. String imageUrl = images.size() == 1 ? images.get(0) : images.get(1);
  513. parseRes = new OCRReportParser().parse(fileName, this.ocrParserUrl, imageUrl);
  514. } catch (Exception e) {
  515. log.error("报告{} OCR识别印章和联系人出错:{}", fileName, ExceptionUtil.stacktraceToString(e));
  516. }
  517. // ocr识别尾页是否包含印章和联系人信息
  518. if (parseRes != null) {
  519. if (reportData.getBaseInfo() != null) {
  520. reportData.getBaseInfo().setWithSeals(parseRes.getWithSeals());
  521. reportData.getBaseInfo().setWithContacts(parseRes.getWithContacts());
  522. if (fileName.contains("用印") && !Objects.equals(true, reportData.getBaseInfo().getWithSeals())) {
  523. reportData.getBaseInfo().setWithSeals(true);
  524. }
  525. }
  526. }
  527. }
  528. // 用首页识别基金名称、产品代码和报告日期
  529. if ((reportData.getBaseInfo() != null && reportData.getBaseInfo().getReportDate() == null)
  530. || (reportData.getFundInfo() != null && StrUtil.isBlank(reportData.getFundInfo().getFundName()))
  531. || (reportData.getFundInfo() != null && StrUtil.isBlank(reportData.getFundInfo().getFundCode()))) {
  532. // 首页和尾页不相等时解析首页的数据
  533. if (images.size() != 1) {
  534. try {
  535. parseRes = new OCRReportParser().parse(fileName, this.ocrParserUrl, images.get(0));
  536. } catch (Exception e) {
  537. log.error("报告{} OCR识别首页基金名称和报告日期出错:{}", fileName, ExceptionUtil.stacktraceToString(e));
  538. }
  539. }
  540. // ocr 识别的结果优先级更高
  541. if (reportData.getFundInfo() != null && parseRes != null) {
  542. if (StrUtil.isBlank(reportData.getFundInfo().getFundName())
  543. || (StrUtil.isNotBlank(parseRes.getFundName())
  544. && !Objects.equals(reportData.getFundInfo().getFundName(), parseRes.getFundName()))) {
  545. reportData.getFundInfo().setFundName(parseRes.getFundName());
  546. }
  547. if (StrUtil.isBlank(reportData.getFundInfo().getFundCode())
  548. || (StrUtil.isNotBlank(parseRes.getFundCode())
  549. && !Objects.equals(reportData.getFundInfo().getFundCode(), parseRes.getFundCode()))) {
  550. reportData.getFundInfo().setFundCode(parseRes.getFundCode());
  551. }
  552. }
  553. }
  554. }
  555. /**
  556. * 保存报告解析结果
  557. *
  558. * @param reportData 报告解析结果
  559. * @param reportType 报告类型
  560. * @param fileName 报告名称
  561. */
  562. private void saveReportData(ReportData reportData, ReportType reportType, String fileName) {
  563. if (reportData == null) {
  564. return;
  565. }
  566. StopWatch writeWatch = new StopWatch();
  567. writeWatch.start();
  568. try {
  569. ReportWriter<ReportData> instance = this.reportWriterFactory.getInstance(reportType);
  570. instance.write(reportData);
  571. } catch (Exception e) {
  572. log.error("报告{}结果保存失败\n{}", fileName, ExceptionUtil.stacktraceToString(e));
  573. } finally {
  574. writeWatch.stop();
  575. if (log.isInfoEnabled()) {
  576. log.info("报告{}解析结果保存完成,耗时{}ms", fileName, writeWatch.getTotalTimeMillis());
  577. }
  578. }
  579. }
  580. private EmailFileInfoDO saveEmailFileInfo(Integer emailId, String fileName, String filePath) {
  581. EmailFileInfoDO emailFileInfoDO = buildEmailFileInfoDO(emailId, fileName, filePath);
  582. emailFileInfoDO.setAiFileId(null);
  583. if (emailFileInfoDO.getId() != null) {
  584. emailFileInfoMapper.updateTimeById(null, new Date());
  585. return emailFileInfoDO;
  586. }
  587. emailFileInfoMapper.insert(emailFileInfoDO);
  588. return emailFileInfoDO;
  589. }
  590. private EmailFileInfoDO buildEmailFileInfoDO(Integer emailId, String fileName, String filePath) {
  591. EmailFileInfoDO emailFileInfoDO = new EmailFileInfoDO();
  592. emailFileInfoDO.setId(null);
  593. emailFileInfoDO.setEmailId(emailId);
  594. emailFileInfoDO.setFileName(fileName);
  595. emailFileInfoDO.setFilePath(filePath);
  596. emailFileInfoDO.setIsvalid(1);
  597. emailFileInfoDO.setCreatorId(0);
  598. emailFileInfoDO.setCreateTime(new Date());
  599. emailFileInfoDO.setUpdaterId(0);
  600. emailFileInfoDO.setUpdateTime(new Date());
  601. return emailFileInfoDO;
  602. }
  603. private Integer saveEmailParseInfo(EmailParseInfoDO emailParseInfoDO) {
  604. if (emailParseInfoDO == null) {
  605. return null;
  606. }
  607. // 重新邮件功能 -> 修改解析时间和更新时间
  608. if (emailParseInfoDO.getId() != null) {
  609. emailParseInfoMapper.updateParseTime(emailParseInfoDO.getId(), emailParseInfoDO.getParseDate());
  610. return emailParseInfoDO.getId();
  611. }
  612. emailParseInfoMapper.insert(emailParseInfoDO);
  613. return emailParseInfoDO.getId();
  614. }
  615. private EmailParseInfoDO buildEmailParseInfo(Integer emailId, String emailAddress, EmailContentInfoDTO emailContentInfoDTO) {
  616. EmailParseInfoDO emailParseInfoDO = new EmailParseInfoDO();
  617. emailParseInfoDO.setId(emailId);
  618. emailParseInfoDO.setSenderEmail(emailContentInfoDTO.getSenderEmail());
  619. emailParseInfoDO.setEmail(emailAddress);
  620. emailParseInfoDO.setEmailDate(DateUtil.parse(emailContentInfoDTO.getEmailDate(), DateConst.YYYY_MM_DD_HH_MM_SS));
  621. emailParseInfoDO.setParseDate(emailContentInfoDTO.getParseDate() == null ? null : DateUtil.parseDate(emailContentInfoDTO.getParseDate()));
  622. emailParseInfoDO.setEmailTitle(emailContentInfoDTO.getEmailTitle());
  623. emailParseInfoDO.setEmailType(emailContentInfoDTO.getEmailType());
  624. emailParseInfoDO.setParseStatus(EmailParseStatusConst.SUCCESS);
  625. emailParseInfoDO.setAttrSize(emailContentInfoDTO.getFileSize());
  626. emailParseInfoDO.setIsvalid(1);
  627. emailParseInfoDO.setCreatorId(0);
  628. emailParseInfoDO.setCreateTime(new Date());
  629. emailParseInfoDO.setUpdaterId(0);
  630. emailParseInfoDO.setUpdateTime(new Date());
  631. return emailParseInfoDO;
  632. }
  633. /**
  634. * 读取邮件
  635. *
  636. * @param mailboxInfoDTO 邮箱配置信息
  637. * @param startDate 邮件起始日期
  638. * @param endDate 邮件截止日期(为null,将解析邮件日期小于等于startDate的当天邮件)
  639. * @return 读取到的邮件信息
  640. * @throws Exception 异常信息
  641. */
  642. private Map<String, List<EmailContentInfoDTO>> realEmail(MailboxInfoDTO mailboxInfoDTO,
  643. Date startDate, Date endDate,
  644. List<String> folderNames) throws Exception {
  645. if (CollUtil.isEmpty(folderNames)) {
  646. folderNames = ListUtil.toList("INBOX");
  647. }
  648. Store store = EmailUtil.getStoreNew(mailboxInfoDTO);
  649. if (store == null) {
  650. return MapUtil.newHashMap(4);
  651. }
  652. Map<String, List<EmailContentInfoDTO>> result = MapUtil.newHashMap(128);
  653. try {
  654. if (log.isInfoEnabled()) {
  655. Folder[] list = store.getDefaultFolder().list("*");
  656. List<String> names = Arrays.stream(list).map(Folder::getFullName).toList();
  657. log.info("获取所有邮箱文件夹:{}", names);
  658. }
  659. for (String folderName : folderNames) {
  660. try {
  661. Map<String, List<EmailContentInfoDTO>> temp = this.getFolderEmail(mailboxInfoDTO,
  662. startDate, endDate, store, folderName);
  663. if (MapUtil.isNotEmpty(temp)) {
  664. result.putAll(temp);
  665. }
  666. } catch (Exception e) {
  667. log.warn("文件夹{} 邮件获取失败:{}", folderName, ExceptionUtil.stacktraceToString(e));
  668. }
  669. }
  670. } catch (Exception e) {
  671. log.error("邮件获取失败:{}", ExceptionUtil.stacktraceToString(e));
  672. } finally {
  673. store.close();
  674. }
  675. return result;
  676. }
  677. private Map<String, List<EmailContentInfoDTO>> getFolderEmail(MailboxInfoDTO mailboxInfoDTO,
  678. Date startDate, Date endDate,
  679. Store store, String folderName) throws MessagingException {
  680. // 默认读取收件箱的邮件
  681. Folder folder = store.getFolder(folderName);
  682. folder.open(this.readWriteSeen ? Folder.READ_WRITE : Folder.READ_ONLY);
  683. Message[] messages = getEmailMessage(folder, mailboxInfoDTO.getProtocol(), startDate);
  684. if (messages == null || messages.length == 0) {
  685. log.warn("{} 获取不到邮件 -> 邮箱信息:{},开始时间:{},结束时间:{}", folderName, mailboxInfoDTO, startDate, endDate);
  686. return MapUtil.newHashMap();
  687. }
  688. Map<String, List<EmailContentInfoDTO>> emailMessageMap = MapUtil.newHashMap();
  689. for (Message message : messages) {
  690. long start = System.currentTimeMillis();
  691. List<EmailContentInfoDTO> emailContentInfoDTOList = CollUtil.newArrayList();
  692. String uuidKey = UUID.randomUUID().toString().replaceAll("-", "");
  693. Integer emailType;
  694. String senderEmail;
  695. String emailTitle = message.getSubject();
  696. if (this.readWriteSeen && isMessageRead(message)) {
  697. log.warn("{} 邮件{} 已读,不用重新下载解析!", folderName, emailTitle);
  698. continue;
  699. }
  700. try {
  701. Date emailDate = message.getSentDate();
  702. String emailDateStr = DateUtil.format(emailDate, DateConst.YYYY_MM_DD_HH_MM_SS);
  703. if (log.isInfoEnabled()) {
  704. log.info("{} 邮件{} 数据获取中,邮件时间:{}", folderName, emailTitle, emailDateStr);
  705. }
  706. boolean isNotParseConditionSatisfied = emailDate == null
  707. || (endDate != null && emailDate.compareTo(endDate) > 0)
  708. || (startDate != null && emailDate.compareTo(startDate) < 0);
  709. if (isNotParseConditionSatisfied) {
  710. String st = DateUtil.formatDateTime(startDate);
  711. String ed = DateUtil.formatDateTime(endDate);
  712. log.warn("{} 邮件[{}]日期{}不在区间内【{} ~ {}】", folderName, emailTitle, emailDateStr, st, ed);
  713. continue;
  714. }
  715. senderEmail = getSenderEmail(message);
  716. emailType = EmailUtil.getEmailTypeBySubject(emailTitle);
  717. if (emailType == null) {
  718. log.warn("{} 邮件不满足解析条件 -> 邮件主题:{},邮件日期:{}", folderName, emailTitle, emailDateStr);
  719. continue;
  720. }
  721. if (log.isInfoEnabled()) {
  722. log.info("{} 邮件{} 基本信息获取完成,开始下载附件!邮件日期:{}", folderName, emailTitle, emailDateStr);
  723. }
  724. Object content = message.getContent();
  725. if (content instanceof Multipart multipart) {
  726. this.reMultipart(mailboxInfoDTO.getAccount(), emailTitle, emailDate, multipart, emailContentInfoDTOList);
  727. } else if (content instanceof Part part) {
  728. this.rePart(mailboxInfoDTO.getAccount(), emailTitle, emailDate, part, emailContentInfoDTOList);
  729. } else {
  730. log.warn("{} 不支持的邮件数据 {}", folderName, emailTitle);
  731. }
  732. if (CollUtil.isNotEmpty(emailContentInfoDTOList)) {
  733. emailContentInfoDTOList.forEach(e -> {
  734. e.setEmailType(emailType);
  735. e.setSenderEmail(senderEmail);
  736. });
  737. emailMessageMap.put(uuidKey, emailContentInfoDTOList);
  738. }
  739. if (log.isInfoEnabled()) {
  740. log.info("{} 邮件{} 下载完成,总计耗时{} ms,文件内容如下\n {}", folderName,
  741. emailTitle, System.currentTimeMillis() - start, emailContentInfoDTOList);
  742. }
  743. } catch (Exception e) {
  744. log.error("{} 获取邮箱的邮件{} 报错,堆栈信息:{}", folderName, emailTitle, ExceptionUtil.stacktraceToString(e));
  745. }
  746. }
  747. if (this.readWriteSeen) {
  748. // 设置已读标志
  749. folder.setFlags(messages, new Flags(Flags.Flag.SEEN), true);
  750. }
  751. folder.close(false);
  752. return emailMessageMap;
  753. }
  754. private void rePart(String account, String subject, Date sendDate, Part part,
  755. List<EmailContentInfoDTO> emailContentInfoDTOList) throws Exception {
  756. String fileName = EmailUtil.decodeFileName(part);
  757. if (StrUtil.isBlank(fileName)) {
  758. log.warn("邮件{} 附件文件名是空的,不做下载!", subject);
  759. return;
  760. }
  761. if (fileName.contains("=?")) {
  762. fileName = MimeUtility.decodeText(fileName);
  763. }
  764. String disposition = part.getDisposition();
  765. String contentType = part.getContentType();
  766. boolean isAttachment = Part.ATTACHMENT.equalsIgnoreCase(disposition)
  767. || (contentType != null && attachmentMimePrefixes.stream().anyMatch(prefix ->
  768. StrUtil.startWithIgnoreCase(contentType, prefix)
  769. ));
  770. if (!isAttachment) {
  771. log.warn("邮件 {} 未检测到pdf/zip/rar类型的附件 (fileName={}, disposition={}, contentType={})",
  772. subject, fileName, disposition, contentType);
  773. return;
  774. }
  775. String emailDateStr = DateUtil.format(sendDate, DateConst.YYYYMMDD);
  776. String filePath = path + File.separator + account + File.separator + emailDateStr + File.separator;
  777. // 压缩包重名时的后面的压缩包会覆盖前面压缩包的问题(不考虑普通文件)
  778. String emailDate = DateUtil.format(sendDate, DateConst.YYYYMMDDHHMMSS24);
  779. String realName = (fileName.endsWith(".zip") || fileName.endsWith(".rar")) ? emailDate + fileName : fileName;
  780. File saveFile = FileUtil.file(filePath + realName);
  781. if (!saveFile.exists()) {
  782. if (!saveFile.getParentFile().exists()) {
  783. boolean mkdirs = saveFile.getParentFile().mkdirs();
  784. if (!mkdirs) {
  785. log.warn("file path mkdir failed.");
  786. }
  787. }
  788. try (InputStream is = part.getInputStream()) {
  789. Files.copy(is, saveFile.toPath());
  790. }
  791. } else {
  792. FileUtil.del(saveFile);
  793. try (InputStream is = part.getInputStream()) {
  794. Files.copy(is, saveFile.toPath());
  795. }
  796. }
  797. EmailContentInfoDTO emailContentInfoDTO = new EmailContentInfoDTO();
  798. emailContentInfoDTO.setFileName(fileName);
  799. emailContentInfoDTO.setFileSize(part.getSize());
  800. emailContentInfoDTO.setFilePath(saveFile.getAbsolutePath());
  801. emailContentInfoDTO.setEmailAddress(account);
  802. emailContentInfoDTO.setEmailTitle(subject);
  803. emailContentInfoDTO.setEmailDate(DateUtil.format(sendDate, DateConst.YYYY_MM_DD_HH_MM_SS));
  804. emailContentInfoDTOList.add(emailContentInfoDTO);
  805. }
  806. private void reMultipart(String account, String subject, Date emailDate, Multipart multipart,
  807. List<EmailContentInfoDTO> emailContentInfoDTOList) throws Exception {
  808. for (int i = 0; i < multipart.getCount(); i++) {
  809. Part bodyPart = multipart.getBodyPart(i);
  810. Object content = bodyPart.getContent();
  811. if (content instanceof String) {
  812. if (log.isDebugEnabled()) {
  813. log.debug("邮件{} 获取的正文不做解析,内容是 {}", subject, content);
  814. }
  815. continue;
  816. }
  817. if (content instanceof Multipart mp) {
  818. this.reMultipart(account, subject, emailDate, mp, emailContentInfoDTOList);
  819. } else {
  820. this.rePart(account, subject, emailDate, bodyPart, emailContentInfoDTOList);
  821. }
  822. }
  823. }
  824. private String getSenderEmail(Message message) {
  825. Address[] senderAddress;
  826. try {
  827. senderAddress = message.getFrom();
  828. if (senderAddress == null || senderAddress.length == 0) {
  829. return null;
  830. }
  831. // 此时的address是含有编码(MIME编码方式)后的文本和实际的邮件地址
  832. String address = "";
  833. for (Address from : senderAddress) {
  834. if (StrUtil.isNotBlank(from.toString())) {
  835. address = from.toString();
  836. break;
  837. }
  838. }
  839. // 正则表达式匹配邮件地址
  840. Pattern pattern = Pattern.compile("<(\\S+)>");
  841. Matcher matcher = pattern.matcher(address);
  842. if (matcher.find()) {
  843. return matcher.group(1);
  844. }
  845. } catch (MessagingException e) {
  846. log.error(e.getMessage(), e);
  847. }
  848. return null;
  849. }
  850. private Message[] getEmailMessage(Folder folder, String protocol, Date startDate) {
  851. try {
  852. if (protocol.contains("imap")) {
  853. // 获取邮件日期大于等于startDate的邮件(搜索条件只支持按天)
  854. SearchTerm startDateTerm = new ReceivedDateTerm(ComparisonTerm.GE, startDate);
  855. return folder.search(startDateTerm);
  856. } else {
  857. return folder.getMessages();
  858. }
  859. } catch (MessagingException e) {
  860. throw new RuntimeException(e);
  861. }
  862. }
  863. /**
  864. * 检查邮件是否已读
  865. *
  866. * @param message 邮件对象
  867. * @return true表示已读,false表示未读
  868. * @throws MessagingException 如果访问邮件标志时出错
  869. */
  870. private boolean isMessageRead(Message message) throws MessagingException {
  871. // 获取邮件的所有标志
  872. Flags flags = message.getFlags();
  873. // 检查是否包含 SEEN 标志
  874. return flags.contains(Flags.Flag.SEEN);
  875. }
  876. }