Преглед изворног кода

fix:修复确认DNA部分没有识别到文件编码的问题

wangzaijun пре 1 месец
родитељ
комит
17c0dd77c5

+ 6 - 0
mo-daq/src/main/java/com/smppw/modaq/application/components/ReportParseUtils.java

@@ -579,5 +579,11 @@ public final class ReportParseUtils {
         emailType = EmailUtil.getEmailTypeBySubject(text);
         reportType = matchReportType(emailType, text);
         System.out.println(emailType + ",reportType=" + reportType + ",reportDate=" + matchReportDate(reportType, text));
+
+        text = "(水印)SH7639_年报_龙旗巨星一号私募投资基金_2024年 (2).pdf";
+        emailType = EmailUtil.getEmailTypeBySubject(text);
+        reportType = matchReportType(emailType, text);
+        System.out.println(emailType + ",reportType=" + reportType + ",reportDate=" + matchReportDate(reportType, text));
+
     }
 }

+ 1 - 0
mo-daq/src/main/java/com/smppw/modaq/infrastructure/util/ExcelUtil.java

@@ -417,6 +417,7 @@ public class ExcelUtil {
     private static boolean hasLowMeaningfulness(String text) {
         // 假设正常文本应包含常见停用词(的、是、在等)
         List<String> commonWords = ListUtil.list(false);
+        commonWords.add("基金");
         commonWords.addAll(ListUtil.toList(ReportType.ANNUALLY.getPatterns()));
         commonWords.addAll(ListUtil.toList(ReportType.QUARTERLY.getPatterns()));
         commonWords.addAll(ListUtil.toList(ReportType.MONTHLY.getPatterns()));