NavEmailParser.java 30 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558
  1. package com.simuwang.daq.service;
  2. import cn.hutool.core.collection.CollUtil;
  3. import cn.hutool.core.collection.ListUtil;
  4. import cn.hutool.core.exceptions.ExceptionUtil;
  5. import cn.hutool.core.lang.Pair;
  6. import cn.hutool.core.map.MapUtil;
  7. import cn.hutool.core.util.StrUtil;
  8. import com.simuwang.base.common.conts.EmailDataDirectionConst;
  9. import com.simuwang.base.common.conts.EmailFieldConst;
  10. import com.simuwang.base.common.conts.EmailTypeConst;
  11. import com.simuwang.base.common.util.DateUtils;
  12. import com.simuwang.base.common.util.ExcelUtil;
  13. import com.simuwang.base.common.util.StringUtil;
  14. import com.simuwang.base.pojo.dto.EmailContentInfoDTO;
  15. import com.simuwang.base.pojo.dto.EmailFundNavDTO;
  16. import com.simuwang.base.pojo.dto.FieldPositionDTO;
  17. import org.apache.poi.ss.usermodel.Cell;
  18. import org.apache.poi.ss.usermodel.Row;
  19. import org.apache.poi.ss.usermodel.Sheet;
  20. import org.slf4j.Logger;
  21. import org.slf4j.LoggerFactory;
  22. import org.springframework.beans.factory.annotation.Value;
  23. import org.springframework.stereotype.Component;
  24. import java.io.File;
  25. import java.util.*;
  26. import java.util.stream.Collectors;
  27. /**
  28. * @author mozuwen
  29. * @date 2024-09-04
  30. * @description 净值邮件解析器
  31. */
  32. @Component
  33. public class NavEmailParser extends AbstractEmailParser {
  /** Logger bound to this class so log lines are attributed to the NAV parser, not its base class. */
  private static final Logger log = LoggerFactory.getLogger(NavEmailParser.class);

  /** Path prefix (property {@code email.file.path}) used when building the output path of converted PDFs. */
  @Value("${email.file.path}")
  private String path;

  /** When {@code true}, template parsing is run even if generic parsing already produced valid records. */
  @Value("${email.parse.force-template-enable}")
  private boolean forceTemplateEnable;

  /** Fallback parser used when a NAV e-mail actually carries a valuation sheet. */
  private final ValuationEmailParser valuationEmailParser;

  /** Template-driven parser used when generic parsing yields no valid record (or when forced). */
  private final EmailTemplateService emailTemplateService;

  /** Not referenced anywhere in this class; retained unchanged. */
  private static final int MAX_COLUMN = 20;

  /**
   * Second argument handed to {@code StringUtil.retainChineseCharacters} when normalising header text.
   * NOTE(review): presumably header texts that must be kept verbatim — confirm against StringUtil.
   */
  private static final List<String> NOT_CONVERT_FIELD_LIST = ListUtil.toList("TA代码");

  /**
   * Creates the parser with its collaborating services.
   *
   * @param valuationEmailParser parser tried when the attachment is a valuation sheet
   * @param emailTemplateService service that parses e-mails using configured templates
   */
  public NavEmailParser(ValuationEmailParser valuationEmailParser, EmailTemplateService emailTemplateService) {
    this.valuationEmailParser = valuationEmailParser;
    this.emailTemplateService = emailTemplateService;
  }
  47. @Override
  48. public boolean isSupport(Integer emailType) {
  49. return EmailTypeConst.NAV_EMAIL_TYPE.equals(emailType);
  50. }
  51. @Override
  52. public List<EmailFundNavDTO> parse(EmailContentInfoDTO emailContentInfoDTO, Map<String, List<String>> emailFieldMap) {
  53. List<EmailFundNavDTO> emailFundNavDTOList = CollUtil.newArrayList();
  54. String emailContent = emailContentInfoDTO.getEmailContent();
  55. // 1.解析邮件正文
  56. if (StrUtil.isNotBlank(emailContentInfoDTO.getFilePath()) && ExcelUtil.isHTML(emailContentInfoDTO.getFileName())) {
  57. String excelFilePath = emailContentInfoDTO.getFilePath().replace(".html", ".xlsx");
  58. emailFundNavDTOList = parseEmailContent(emailContent, excelFilePath, emailFieldMap);
  59. }
  60. // 2.解析邮件excel附件
  61. if (StrUtil.isNotBlank(emailContentInfoDTO.getFilePath()) && ExcelUtil.isExcel(emailContentInfoDTO.getFileName())) {
  62. List<EmailFundNavDTO> fundNavDTOList = parseExcelFile(emailContentInfoDTO.getFilePath(), emailFieldMap);
  63. Optional.ofNullable(fundNavDTOList).ifPresent(emailFundNavDTOList::addAll);
  64. }
  65. // 3.解析邮件pdf附件
  66. if (StrUtil.isNotBlank(emailContentInfoDTO.getFilePath()) && ExcelUtil.isPdf(emailContentInfoDTO.getFileName())) {
  67. String excelFilePath = path + emailContentInfoDTO.getEmailAddress() + "/" + emailContentInfoDTO.getEmailDate().substring(0, 10).replaceAll("-", "")
  68. + "/" + emailContentInfoDTO.getFileName().replace(".pdf", System.currentTimeMillis()+".xlsx").replace(".PDF", System.currentTimeMillis()+".xlsx");
  69. List<EmailFundNavDTO> fundNavDTOList = parsePdfFile(emailContentInfoDTO.getFilePath(), excelFilePath, emailFieldMap);
  70. Optional.ofNullable(fundNavDTOList).ifPresent(emailFundNavDTOList::addAll);
  71. }
  72. // 4.解析邮件zip,rar附件
  73. if (StrUtil.isNotBlank(emailContentInfoDTO.getFilePath()) && (ExcelUtil.isZip(emailContentInfoDTO.getFileName()) || ExcelUtil.isRAR(emailContentInfoDTO.getFileName()))) {
  74. List<EmailFundNavDTO> fundNavDTOList = parsePackageFile(emailContentInfoDTO, emailContentInfoDTO.getFileName(), emailContentInfoDTO.getFilePath(), emailFieldMap);
  75. Optional.ofNullable(fundNavDTOList).ifPresent(emailFundNavDTOList::addAll);
  76. }
  77. // 兼容净值邮件,但附件是估值表的情况
  78. if (CollUtil.isEmpty(emailFundNavDTOList)) {
  79. // 判断文件名是否包含"估值表"
  80. String fileName = emailContentInfoDTO.getFileName();
  81. if (StrUtil.isNotBlank(fileName) && fileName.contains("估值表")) {
  82. emailFundNavDTOList = valuationEmailParser.parse(emailContentInfoDTO, emailFieldMap);
  83. }
  84. }
  85. // email_fund_nav增加template_id字段
  86. if (CollUtil.isNotEmpty(emailFundNavDTOList)) {
  87. emailFundNavDTOList.forEach(e -> e.setTemplateId(0));
  88. }
  89. // 通用模版解析 -> 根据配置的模板进行解析
  90. long successNavCount = 0;
  91. if (CollUtil.isNotEmpty(emailFundNavDTOList)) {
  92. successNavCount = emailFundNavDTOList.stream().filter(e -> e != null && StrUtil.isBlank(e.getFailReason())).count();
  93. }
  94. //如果通用模板解析不到正确数据,就走模板解析一次
  95. if (successNavCount == 0 || forceTemplateEnable) {
  96. List<EmailFundNavDTO> templateFundNavDTOList = emailTemplateService.parseUsingTemplate(emailContentInfoDTO);
  97. if(CollUtil.isNotEmpty(templateFundNavDTOList)){
  98. emailFundNavDTOList.addAll(templateFundNavDTOList);
  99. }
  100. }
  101. return emailFundNavDTOList;
  102. }
  103. private List<EmailFundNavDTO> parsePackageFile(EmailContentInfoDTO emailContentInfoDTO, String fileName, String filePath, Map<String, List<String>> emailFieldMap) {
  104. List<EmailFundNavDTO> emailFundNavDTOList = CollUtil.newArrayList();
  105. if(ExcelUtil.isZip(filePath)){
  106. String destPath = filePath.replaceAll(".zip", "").replaceAll(".ZIP", "");
  107. log.info("压缩包地址:{},解压后文件地址:{}", filePath, destPath);
  108. List<String> dir = ExcelUtil.extractCompressedFiles(filePath, destPath);
  109. for (String zipFilePath : dir) {
  110. emailFundNavDTOList.addAll(parseZipFile(emailContentInfoDTO, zipFilePath, emailFieldMap));
  111. File file = new File(zipFilePath);
  112. if (file.isDirectory()) {
  113. for (String navFilePath : Objects.requireNonNull(file.list())) {
  114. emailFundNavDTOList.addAll(parseZipFile(emailContentInfoDTO, navFilePath, emailFieldMap));
  115. }
  116. }
  117. }
  118. }
  119. try{
  120. if(ExcelUtil.isRAR(filePath)){
  121. String destPath = filePath.replaceAll(".rar", "").replaceAll(".RAR", "");
  122. File destFile = new File(destPath);
  123. if (!destFile.exists()) {
  124. destFile.mkdirs();
  125. }
  126. List<String> rarDir = ExcelUtil.extractRar(filePath, destPath);
  127. for (String rarFilePath : rarDir) {
  128. emailFundNavDTOList.addAll(parseZipFile(emailContentInfoDTO, rarFilePath, emailFieldMap));
  129. File file = new File(rarFilePath);
  130. if (file.isDirectory()) {
  131. for (String navFilePath : Objects.requireNonNull(file.list())) {
  132. emailFundNavDTOList.addAll(parseZipFile(emailContentInfoDTO, navFilePath, emailFieldMap));
  133. }
  134. }
  135. }
  136. }
  137. }catch (Exception e){
  138. log.error(e.getMessage(),e);
  139. }
  140. return emailFundNavDTOList;
  141. }
  142. private List<EmailFundNavDTO> parseZipFile(EmailContentInfoDTO emailContentInfoDTO, String zipFilePath, Map<String, List<String>> emailFieldMap) {
  143. List<EmailFundNavDTO> fundNavDTOList = CollUtil.newArrayList();
  144. if (ExcelUtil.isPdf(zipFilePath)) {
  145. String excelFilePath = zipFilePath.replace(".pdf", System.currentTimeMillis()+".xlsx").replace(".PDF", System.currentTimeMillis()+".xlsx");
  146. fundNavDTOList = parsePdfFile(zipFilePath, excelFilePath, emailFieldMap);
  147. }
  148. if (ExcelUtil.isExcel(zipFilePath)) {
  149. fundNavDTOList = parseExcelFile(zipFilePath, emailFieldMap);
  150. }
  151. if (ExcelUtil.isZip(zipFilePath)) {
  152. String name = new File(zipFilePath).getName();
  153. fundNavDTOList = parsePackageFile(emailContentInfoDTO, name, zipFilePath, emailFieldMap);
  154. }
  155. return fundNavDTOList;
  156. }
  157. private List<EmailFundNavDTO> parsePdfFile(String filePath, String excelFilePath, Map<String, List<String>> emailFieldMap) {
  158. excelFilePath = ExcelUtil.pdfConvertToExcel(filePath, excelFilePath);
  159. if (StrUtil.isBlank(excelFilePath)) {
  160. return CollUtil.newArrayList();
  161. }
  162. return parseExcelFile(excelFilePath, emailFieldMap);
  163. }
  164. /**
  165. * 解析邮件excel附件
  166. *
  167. * @param filePath 邮件excel附件地址
  168. * @param emailFieldMap 邮件字段识别规则映射表
  169. * @return 解析到的净值数据
  170. */
  171. private List<EmailFundNavDTO> parseExcelFile(String filePath, Map<String, List<String>> emailFieldMap) {
  172. Sheet sheet = ExcelUtil.getFirstSheet(filePath);
  173. if (sheet == null) {
  174. log.info("获取不到有效的sheet页面,文件路径:{}", filePath);
  175. return CollUtil.newArrayList();
  176. }
  177. // 1.找到表头所在位置
  178. Map<String, Pair<Integer, Integer>> fieldPositionMap = getFieldPosition(sheet, emailFieldMap);
  179. if (MapUtil.isEmpty(fieldPositionMap)) {
  180. log.warn("找不到文件表头字段 -> 文件:{}", filePath);
  181. return CollUtil.newArrayList();
  182. }
  183. // 2.解析sheet中的净值数据
  184. List<EmailFundNavDTO> emailFundNavDTOList = parseSheetData(filePath, sheet, fieldPositionMap, null);
  185. // 3.校验净值数据格式 并 设置数据校验不通过的原因
  186. if (CollUtil.isNotEmpty(emailFundNavDTOList)) {
  187. emailFundNavDTOList.forEach(e -> e.setFailReason(super.checkDataFailReason(e)));
  188. }
  189. return emailFundNavDTOList;
  190. }
  191. /**
  192. * 解析邮件正文
  193. *
  194. * @param emailContent 正文内容
  195. * @param emailFieldMap 邮件字段识别规则映射表
  196. * @return 解析到的净值数据
  197. */
  198. private List<EmailFundNavDTO> parseEmailContent(String emailContent, String excelFilePath, Map<String, List<String>> emailFieldMap) {
  199. excelFilePath = ExcelUtil.contentConvertToExcel(emailContent, excelFilePath);
  200. if (StrUtil.isBlank(excelFilePath)) {
  201. return CollUtil.newArrayList();
  202. }
  203. return parseExcelFile(excelFilePath, emailFieldMap);
  204. }
  205. /**
  206. * 根据字段所在表格的位置提取净值数据
  207. *
  208. * @param filePath 文件路径·
  209. * @param sheet 表格中的sheet页
  210. * @param fieldPositionMap 字段所在表格中的位置
  211. * @param direction 表格数据的形式:1-行,2-列
  212. * @return 净值数据
  213. */
  214. private List<EmailFundNavDTO> parseSheetData(String filePath, Sheet sheet, Map<String, Pair<Integer, Integer>> fieldPositionMap, Integer direction) {
  215. List<EmailFundNavDTO> fundNavDTOList = CollUtil.newArrayList();
  216. // 通过表头所在位置判断是行数据还是列数据
  217. Integer dataDirectionType = direction != null ? direction : ExcelUtil.detectDataDirection(fieldPositionMap);
  218. // 数据起始行,起始列
  219. int initRow = dataDirectionType.equals(EmailDataDirectionConst.ROW_DIRECTION_TYPE) ? fieldPositionMap.values().stream().map(Pair::getKey).max(Integer::compareTo).orElse(0)
  220. : fieldPositionMap.values().stream().map(Pair::getKey).min(Integer::compareTo).orElse(0);
  221. int initColumn = fieldPositionMap.values().stream().map(Pair::getValue).min(Integer::compareTo).orElse(0);
  222. if (dataDirectionType.equals(EmailDataDirectionConst.ROW_DIRECTION_TYPE)) {
  223. // 表头字段-列号映射关系
  224. Map<String, Integer> fieldColumnMap = getFieldRow(fieldPositionMap);
  225. int lastRowNum = sheet.getLastRowNum();
  226. // 遍历可能的数据行
  227. for (int rowNum = initRow + 1; rowNum <= lastRowNum; rowNum++) {
  228. Row sheetRow = sheet.getRow(rowNum);
  229. try {
  230. Optional.ofNullable(readSheetRowData(sheetRow, fieldColumnMap)).ifPresent(fundNavDTOList::addAll);
  231. } catch (Exception e) {
  232. log.error("读取行数据报错 -> 行号:{},文件路径:{},堆栈信息:{}", rowNum, filePath, ExceptionUtil.stacktraceToString(e));
  233. }
  234. }
  235. }
  236. if (dataDirectionType.equals(EmailDataDirectionConst.COLUMN_DIRECTION_TYPE)) {
  237. // 表头字段-行号映射关系
  238. Map<Integer, String> fieldRowMap = getRowField(fieldPositionMap);
  239. int lastRow = fieldPositionMap.values().stream().map(Pair::getKey).max(Integer::compareTo).orElse(0);
  240. // 遍历每一列
  241. for (int columnNum = initColumn + 1; columnNum < EmailDataDirectionConst.MAX_ROW_COLUMN; columnNum++) {
  242. Map<String, String> fieldValueMap = MapUtil.newHashMap();
  243. for (int rowNum = initRow; rowNum <= lastRow; rowNum++) {
  244. Row row = sheet.getRow(rowNum);
  245. Cell cell = row.getCell(columnNum);
  246. if (cell == null) {
  247. continue;
  248. }
  249. fieldValueMap.put(fieldRowMap.get(rowNum), ExcelUtil.getCellValue(cell));
  250. }
  251. Optional.ofNullable(buildEmailFundNavDTO(fieldValueMap)).ifPresent(fundNavDTOList::add);
  252. }
  253. }
  254. // 兼容净值日期为空的情况
  255. addPriceDateIfMiss(fundNavDTOList, getPriceDateFromSheet(sheet, initRow));
  256. return fundNavDTOList;
  257. }
  258. private void addPriceDateIfMiss(List<EmailFundNavDTO> fundNavDTOList, String priceDate) {
  259. if (fundNavDTOList.stream().map(EmailFundNavDTO::getPriceDate).allMatch(StrUtil::isBlank)) {
  260. fundNavDTOList.forEach(e -> e.setPriceDate(priceDate));
  261. }
  262. }
  263. private String getPriceDateFromSheet(Sheet sheet, Integer maxRowNum) {
  264. Map<Integer, String> priceDateMap = MapUtil.newHashMap();
  265. for (int rowNum = 0; rowNum < maxRowNum; rowNum++) {
  266. Row row = sheet.getRow(rowNum);
  267. if (row == null) {
  268. continue;
  269. }
  270. int lastCellNum = row.getLastCellNum();
  271. for (int columnNum = 0; columnNum < lastCellNum; columnNum++) {
  272. Cell cell = row.getCell(columnNum);
  273. if (cell == null) {
  274. continue;
  275. }
  276. String cellValue = ExcelUtil.getCellValue(cell);
  277. if (StrUtil.isNotBlank(cellValue) && cellValue.contains("截至")) {
  278. int index = cellValue.indexOf("截至");
  279. String date = cellValue.substring(index + 2, index + 2 + 10);
  280. if (StrUtil.isNotBlank(date)) {
  281. date = date.replaceAll("年", "-").replaceAll("月", "-");
  282. }
  283. priceDateMap.put(1, date);
  284. continue;
  285. }
  286. String priceDate = DateUtils.stringToDate(cellValue);
  287. if (StrUtil.isNotBlank(priceDate)) {
  288. priceDateMap.put(2, priceDate);
  289. }
  290. }
  291. }
  292. if (MapUtil.isNotEmpty(priceDateMap)) {
  293. Integer key = priceDateMap.keySet().stream().min(Integer::compareTo).orElse(null);
  294. return priceDateMap.get(key);
  295. }
  296. return null;
  297. }
  298. private EmailFundNavDTO buildEmailFundNavDTO(Map<String, String> fieldValueMap) {
  299. if (MapUtil.isEmpty(fieldValueMap) || fieldValueMap.values().stream().allMatch(StrUtil::isBlank)) {
  300. return null;
  301. }
  302. EmailFundNavDTO fundNavDTO = new EmailFundNavDTO();
  303. fundNavDTO.setFundName(fieldValueMap.get(EmailFieldConst.FUND_NAME));
  304. fundNavDTO.setRegisterNumber(fieldValueMap.get(EmailFieldConst.REGISTER_NUMBER));
  305. String priceDate = fieldValueMap.get(EmailFieldConst.PRICE_DATE);
  306. boolean isDateFormat = StrUtil.isNotBlank(priceDate) && StringUtil.isNumeric(priceDate) && StringUtil.compare2NumericValue(priceDate);
  307. if (isDateFormat) {
  308. priceDate = ExcelUtil.convertExcelDateToString(priceDate);
  309. }
  310. fundNavDTO.setPriceDate(priceDate);
  311. fundNavDTO.setNav(fieldValueMap.get(EmailFieldConst.NAV));
  312. fundNavDTO.setCumulativeNavWithdrawal(fieldValueMap.get(EmailFieldConst.CUMULATIVE_NAV_WITHDRAWAL));
  313. // pdf解析到的值带有",",比如:"10,656,097.37"
  314. String assetNet = fieldValueMap.get(EmailFieldConst.ASSET_NET);
  315. fundNavDTO.setAssetNet(ExcelUtil.numberDataStripCommas(assetNet));
  316. String assetShares = fieldValueMap.get(EmailFieldConst.ASSET_SHARE);
  317. fundNavDTO.setAssetShare(ExcelUtil.numberDataStripCommas(assetShares));
  318. return fundNavDTO;
  319. }
  320. private List<EmailFundNavDTO> readSheetRowData(Row sheetRow, Map<String, Integer> columnFieldMap) {
  321. if (sheetRow == null) {
  322. return null;
  323. }
  324. String nav = columnFieldMap.get(EmailFieldConst.NAV) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.NAV)) != null
  325. ? ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.NAV))) : null;
  326. String cumulativeNavWithdrawal = columnFieldMap.get(EmailFieldConst.CUMULATIVE_NAV_WITHDRAWAL) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.CUMULATIVE_NAV_WITHDRAWAL)) != null ?
  327. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.CUMULATIVE_NAV_WITHDRAWAL))) : null;
  328. String assetNet = columnFieldMap.get(EmailFieldConst.ASSET_NET) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.ASSET_NET)) != null ?
  329. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.ASSET_NET))) : null;
  330. List<EmailFundNavDTO> fundNavDTOList = CollUtil.newArrayList();
  331. EmailFundNavDTO emailFundNavDTO = new EmailFundNavDTO();
  332. String priceDate = columnFieldMap.get(EmailFieldConst.PRICE_DATE) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PRICE_DATE)) != null ?
  333. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PRICE_DATE))) : null;
  334. boolean isDateFormat = StrUtil.isNotBlank(priceDate) && StringUtil.isNumeric(priceDate) && StringUtil.compare2NumericValue(priceDate);
  335. if (isDateFormat) {
  336. priceDate = ExcelUtil.convertExcelDateToString(priceDate);
  337. }
  338. priceDate = DateUtils.stringToDate(priceDate);
  339. // 份额基金净值文件格式
  340. long parentFiledCount = columnFieldMap.keySet().stream().filter(e -> e.contains("parent")).count();
  341. if (parentFiledCount >= 1) {
  342. Optional.ofNullable(buildParentNav(sheetRow, columnFieldMap, priceDate)).ifPresent(fundNavDTOList::add);
  343. }
  344. emailFundNavDTO.setPriceDate(priceDate);
  345. String fundName = ExcelUtil.getPriorityFieldValue(sheetRow, columnFieldMap.get(EmailFieldConst.LEVEL_FUND_NAME), columnFieldMap.get(EmailFieldConst.FUND_NAME));
  346. emailFundNavDTO.setFundName(fundName);
  347. String registerNumber = ExcelUtil.getPriorityFieldValue(sheetRow, columnFieldMap.get(EmailFieldConst.LEVEL_REGISTER_NUMBER), columnFieldMap.get(EmailFieldConst.REGISTER_NUMBER));
  348. emailFundNavDTO.setRegisterNumber(registerNumber);
  349. emailFundNavDTO.setNav(nav);
  350. emailFundNavDTO.setCumulativeNavWithdrawal(cumulativeNavWithdrawal);
  351. String virtualNav = columnFieldMap.get(EmailFieldConst.VIRTUAL_NAV) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.VIRTUAL_NAV)) != null ?
  352. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.VIRTUAL_NAV))) : null;
  353. emailFundNavDTO.setVirtualNav(virtualNav);
  354. emailFundNavDTO.setAssetNet(ExcelUtil.numberDataStripCommas(assetNet));
  355. String assetShares = columnFieldMap.get(EmailFieldConst.ASSET_SHARE) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.ASSET_SHARE)) != null ?
  356. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.ASSET_SHARE))) : null;
  357. emailFundNavDTO.setAssetShare(ExcelUtil.numberDataStripCommas(assetShares));
  358. fundNavDTOList.add(emailFundNavDTO);
  359. return fundNavDTOList;
  360. }
  361. private EmailFundNavDTO buildParentNav(Row sheetRow, Map<String, Integer> columnFieldMap, String priceDate) {
  362. EmailFundNavDTO emailFundNavDTO = new EmailFundNavDTO();
  363. String nav = columnFieldMap.get(EmailFieldConst.PARENT_NAV) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_NAV)) != null ?
  364. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_NAV))) : null;
  365. String cumulativeNavWithdrawal = columnFieldMap.get(EmailFieldConst.PARENT_CUMULATIVE_NAV_WITHDRAWAL) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_CUMULATIVE_NAV_WITHDRAWAL)) != null ?
  366. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_CUMULATIVE_NAV_WITHDRAWAL))) : null;
  367. if (StrUtil.isBlank(nav) && StrUtil.isBlank(cumulativeNavWithdrawal)) {
  368. return null;
  369. }
  370. emailFundNavDTO.setPriceDate(priceDate);
  371. String fundName = columnFieldMap.get(EmailFieldConst.PARENT_FUND_NAME) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_FUND_NAME)).getStringCellValue() != null ?
  372. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_FUND_NAME))) : null;
  373. emailFundNavDTO.setFundName(fundName);
  374. String registerNumber = columnFieldMap.get(EmailFieldConst.PARENT_REGISTER_NUMBER) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_REGISTER_NUMBER)) != null ?
  375. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_REGISTER_NUMBER))) : null;
  376. emailFundNavDTO.setRegisterNumber(registerNumber);
  377. emailFundNavDTO.setNav(nav);
  378. emailFundNavDTO.setCumulativeNavWithdrawal(cumulativeNavWithdrawal);
  379. String virtualNav = columnFieldMap.get(EmailFieldConst.PARENT_VIRTUAL_NAV) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_VIRTUAL_NAV)) != null ?
  380. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_VIRTUAL_NAV))) : null;
  381. emailFundNavDTO.setVirtualNav(virtualNav);
  382. String assetNet = columnFieldMap.get(EmailFieldConst.PARENT_ASSET_NET) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_ASSET_NET)) != null ?
  383. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_ASSET_NET))) : null;
  384. emailFundNavDTO.setAssetNet(ExcelUtil.numberDataStripCommas(assetNet));
  385. String assetShares = columnFieldMap.get(EmailFieldConst.PARENT_ASSET_SHARE) != null && sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_ASSET_SHARE)) != null ?
  386. ExcelUtil.getCellValue(sheetRow.getCell(columnFieldMap.get(EmailFieldConst.PARENT_ASSET_SHARE))) : null;
  387. emailFundNavDTO.setAssetShare(ExcelUtil.numberDataStripCommas(assetShares));
  388. return emailFundNavDTO;
  389. }
  390. private Map<String, Integer> getFieldRow(Map<String, Pair<Integer, Integer>> fieldPositionMap) {
  391. // 考虑日期字段识别逻辑的问题
  392. long rowNumCount = fieldPositionMap.values().stream().map(Pair::getKey).distinct().count();
  393. if (rowNumCount > 1) {
  394. // 存在合并单元格的方式 -> 日期字段所在位置可能会存在错误
  395. Pair<Integer, Integer> priceDatePair = fieldPositionMap.get(EmailFieldConst.PRICE_DATE);
  396. //补丁,如果存在合并单元格,判断日期所在的行是否有其他字段列,如果存在,则表名是行格式数据,而不是其他格式数据
  397. if(priceDatePair != null){
  398. List<Integer> pairKey = fieldPositionMap.values().stream().map(Pair::getKey).collect(Collectors.toList());
  399. List<Integer> priceDateKey = pairKey.stream().filter(e -> e == priceDatePair.getKey()).collect(Collectors.toList());
  400. if(priceDateKey.size() < 2){
  401. fieldPositionMap.remove(EmailFieldConst.PRICE_DATE);
  402. }
  403. }
  404. }
  405. Map<String, Integer> fieldRowMap = MapUtil.newHashMap();
  406. for (Map.Entry<String, Pair<Integer, Integer>> fieldPositionEntry : fieldPositionMap.entrySet()) {
  407. String field = fieldPositionEntry.getKey();
  408. Integer column = fieldPositionEntry.getValue().getValue();
  409. fieldRowMap.put(field, column);
  410. }
  411. return fieldRowMap;
  412. }
  413. private Map<Integer, String> getRowField(Map<String, Pair<Integer, Integer>> fieldPositionMap) {
  414. Map<Integer, String> fieldRowMap = MapUtil.newHashMap();
  415. for (Map.Entry<String, Pair<Integer, Integer>> fieldPositionEntry : fieldPositionMap.entrySet()) {
  416. String field = fieldPositionEntry.getKey();
  417. Integer column = fieldPositionEntry.getValue().getKey();
  418. fieldRowMap.put(column, field);
  419. }
  420. return fieldRowMap;
  421. }
  422. /**
  423. * 找出excel中表头所在的位置
  424. *
  425. * @param sheet 表格工作簿
  426. * @param emailFieldMap 邮件字段识别规则映射表
  427. * @return excel中表头所在的位置(行, 列)
  428. */
  429. private Map<String, Pair<Integer, Integer>> getFieldPosition(Sheet sheet, Map<String, List<String>> emailFieldMap) {
  430. Map<String, List<FieldPositionDTO>> tempFieldPositionMap = MapUtil.newHashMap();
  431. int lastRowNum = sheet.getLastRowNum();
  432. for (int rowNum = 0; rowNum <= lastRowNum; rowNum++) {
  433. Row sheetRow = sheet.getRow(rowNum);
  434. if (sheetRow == null) {
  435. continue;
  436. }
  437. int lastCellNum = sheetRow.getLastCellNum();
  438. for (int cellNum = 0; cellNum < lastCellNum; cellNum++) {
  439. Cell cell = sheetRow.getCell(cellNum);
  440. if (cell == null) {
  441. continue;
  442. }
  443. String cellValue = ExcelUtil.getCellValue(cell);
  444. // 移除掉非中文字符
  445. String newCellValue = StringUtil.retainChineseCharacters(cellValue, NOT_CONVERT_FIELD_LIST);
  446. String field = fieldMatch(newCellValue, emailFieldMap);
  447. if (StrUtil.isNotBlank(field)) {
  448. List<FieldPositionDTO> fieldPositionDTOList = tempFieldPositionMap.getOrDefault(field, new ArrayList<>());
  449. fieldPositionDTOList.add(new FieldPositionDTO(newCellValue, Pair.of(rowNum, cellNum)));
  450. tempFieldPositionMap.put(field, fieldPositionDTOList);
  451. }
  452. }
  453. }
  454. // 判断是不是份额基金净值文件格式(同时存在两个备案编码字段)
  455. return handlerFieldPosition(tempFieldPositionMap);
  456. }
  457. private Map<String, Pair<Integer, Integer>> handlerFieldPosition(Map<String, List<FieldPositionDTO>> tempFieldPositionMap) {
  458. Map<String, Pair<Integer, Integer>> fieldPositionMap = MapUtil.newHashMap();
  459. boolean hasParentField = tempFieldPositionMap.keySet().stream().anyMatch(e -> e.contains("parent"));
  460. for (Map.Entry<String, List<FieldPositionDTO>> entry : tempFieldPositionMap.entrySet()) {
  461. String field = entry.getKey();
  462. List<FieldPositionDTO> fieldPositionDTOList = entry.getValue();
  463. int size = fieldPositionDTOList.size();
  464. if (size == 1) {
  465. fieldPositionMap.put(field, fieldPositionDTOList.get(0).getPair());
  466. continue;
  467. }
  468. if ((!hasParentField && size > 1)) {
  469. if (EmailFieldConst.REGISTER_NUMBER.equals(field)) {
  470. Pair<Integer, Integer> pair = fieldPositionDTOList.stream()
  471. .filter(e -> !e.getFieldValue().contains("协会") && !e.getFieldValue().contains("备案")).map(FieldPositionDTO::getPair).findFirst().orElse(null);
  472. fieldPositionMap.put(field, pair);
  473. } else {
  474. fieldPositionMap.put(field, fieldPositionDTOList.get(size - 1).getPair());
  475. }
  476. continue;
  477. }
  478. if ((hasParentField && size > 1)) {
  479. fieldPositionMap.put(field, fieldPositionDTOList.get(0).getPair());
  480. }
  481. }
  482. // 母基金缺少代码的情况
  483. if (hasParentField && fieldPositionMap.get(EmailFieldConst.PARENT_REGISTER_NUMBER) == null) {
  484. List<FieldPositionDTO> fieldPositionDTOS = tempFieldPositionMap.get(EmailFieldConst.REGISTER_NUMBER);
  485. if (CollUtil.isNotEmpty(fieldPositionDTOS)) {
  486. Pair<Integer, Integer> parentRegisterNumberPair = fieldPositionDTOS.stream()
  487. .filter(e -> e.getFieldValue().contains("协会") || e.getFieldValue().contains("备案")).map(FieldPositionDTO::getPair).findFirst().orElse(null);
  488. fieldPositionMap.put(EmailFieldConst.PARENT_REGISTER_NUMBER, parentRegisterNumberPair);
  489. }
  490. }
  491. return fieldPositionMap;
  492. }
  493. /**
  494. * 判断单元格值是否为表头字段
  495. *
  496. * @param cellValue 单元格值
  497. * @param emailFieldMap 邮件字段识别规则映射表
  498. * @return 表头对应的标识
  499. */
  500. public String fieldMatch(String cellValue, Map<String, List<String>> emailFieldMap) {
  501. if (StrUtil.isBlank(cellValue)) {
  502. return null;
  503. }
  504. for (Map.Entry<String, List<String>> fieldEntry : emailFieldMap.entrySet()) {
  505. List<String> fieldList = fieldEntry.getValue();
  506. for (String field : fieldList) {
  507. if (cellValue.equals(field)) {
  508. return fieldEntry.getKey();
  509. }
  510. }
  511. }
  512. return null;
  513. }
  514. }