zoukankan      html  css  js  c++  java
  • Using POI to replace elements in WORD(.docx/.doc)(使用POI替换word中的特定字符/文字)【改进】

    上一篇文章可能有点bug,这个是改进

    package com.xfzx.test.POI.main;
    
    import java.io.File;
    import java.io.FileInputStream;
    import java.io.FileNotFoundException;
    import java.io.FileOutputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.ArrayList;
    import java.util.HashMap;
    import java.util.Iterator;
    import java.util.List;
    import java.util.Map;
    import java.util.Map.Entry;
    import java.util.regex.Matcher;
    import java.util.regex.Pattern;
    
    import org.apache.poi.POIXMLDocument;
    import org.apache.poi.hwpf.HWPFDocument;
    import org.apache.poi.hwpf.usermodel.Range;
    import org.apache.poi.xwpf.usermodel.XWPFDocument;
    import org.apache.poi.xwpf.usermodel.XWPFParagraph;
    import org.apache.poi.xwpf.usermodel.XWPFRun;
    import org.apache.poi.xwpf.usermodel.XWPFTable;
    import org.apache.poi.xwpf.usermodel.XWPFTableCell;
    import org.apache.poi.xwpf.usermodel.XWPFTableRow;
    
    public class WordPOI {
    
        // 返回Docx中需要替换的特殊字符,没有重复项
        // 推荐传入正则表达式参数"\\$\\{[^{}]+\\}"
        public ArrayList<String> getReplaceElementsInWord(String filePath,
                String regex) {
            String[] p = filePath.split("\\.");
            if (p.length > 0) {// 判断文件有无扩展名
                // 比较文件扩展名
                if (p[p.length - 1].equalsIgnoreCase("doc")) {
                    ArrayList<String> al = new ArrayList<>();
                    File file = new File(filePath);
                    HWPFDocument document = null;
                    try {
                        InputStream is = new FileInputStream(file);
                        document = new HWPFDocument(is);
                    } catch (FileNotFoundException e) {
                        e.printStackTrace();
                    } catch (IOException e) {
                        e.printStackTrace();
                    }
                    Range range = document.getRange();
                    String rangeText = range.text();
                    CharSequence cs = rangeText.subSequence(0, rangeText.length());
                    Pattern pattern = Pattern.compile(regex);
                    Matcher matcher = pattern.matcher(cs);
                    int startPosition = 0;
                    while (matcher.find(startPosition)) {
                        if (!al.contains(matcher.group())) {
                            al.add(matcher.group());
                        }
                        startPosition = matcher.end();
                    }
                    return al;
                } else if (p[p.length - 1].equalsIgnoreCase("docx")) {
                    ArrayList<String> al = new ArrayList<>();
                    XWPFDocument document = null;
                    try {
                        document = new XWPFDocument(
                                POIXMLDocument.openPackage(filePath));
                    } catch (IOException e) {
                        e.printStackTrace();
                    }
                    // 遍历段落
                    Iterator<XWPFParagraph> itPara = document
                            .getParagraphsIterator();
                    while (itPara.hasNext()) {
                        XWPFParagraph paragraph = (XWPFParagraph) itPara.next();
                        String paragraphString = paragraph.getText();
                        CharSequence cs = paragraphString.subSequence(0,
                                paragraphString.length());
                        Pattern pattern = Pattern.compile(regex);
                        Matcher matcher = pattern.matcher(cs);
                        int startPosition = 0;
                        while (matcher.find(startPosition)) {
                            if (!al.contains(matcher.group())) {
                                al.add(matcher.group());
                            }
                            startPosition = matcher.end();
                        }
                    }
                    // 遍历表
                    Iterator<XWPFTable> itTable = document.getTablesIterator();
                    while (itTable.hasNext()) {
                        XWPFTable table = (XWPFTable) itTable.next();
                        int rcount = table.getNumberOfRows();
                        for (int i = 0; i < rcount; i++) {
                            XWPFTableRow row = table.getRow(i);
                            List<XWPFTableCell> cells = row.getTableCells();
                            for (XWPFTableCell cell : cells) {
                                String cellText = "";
                                cellText = cell.getText();
                                CharSequence cs = cellText.subSequence(0,
                                        cellText.length());
                                Pattern pattern = Pattern.compile(regex);
                                Matcher matcher = pattern.matcher(cs);
                                int startPosition = 0;
                                while (matcher.find(startPosition)) {
                                    if (!al.contains(matcher.group())) {
                                        al.add(matcher.group());
                                    }
                                    startPosition = matcher.end();
                                }
                            }
                        }
                    }
                    return al;
                } else {
                    return null;
                }
            } else {
                return null;
            }
        }
    
        // 替换word中需要替换的特殊字符
        public static boolean replaceAndGenerateWord(String srcPath,
                String destPath, Map<String, String> map) {
            String[] sp = srcPath.split("\\.");
            String[] dp = destPath.split("\\.");
            if ((sp.length > 0) && (dp.length > 0)) {// 判断文件有无扩展名
                // 比较文件扩展名
                if (sp[sp.length - 1].equalsIgnoreCase("docx")) {
                    try {
                        XWPFDocument document = new XWPFDocument(
                                POIXMLDocument.openPackage(srcPath));
                        // 替换段落中的指定文字
                        Iterator<XWPFParagraph> itPara = document
                                .getParagraphsIterator();
                        while (itPara.hasNext()) {
                            XWPFParagraph paragraph = (XWPFParagraph) itPara.next();
                            List<XWPFRun> runs = paragraph.getRuns();
                            for (int i = 0; i < runs.size(); i++) {
                                String oneparaString = runs.get(i).getText(
                                        runs.get(i).getTextPosition());
                                for (Map.Entry<String, String> entry : map
                                        .entrySet()) {
                                    oneparaString = oneparaString.replace(
                                            entry.getKey(), entry.getValue());
                                }
                                runs.get(i).setText(oneparaString, 0);
                            }
                        }
    
                        // 替换表格中的指定文字
                        Iterator<XWPFTable> itTable = document.getTablesIterator();
                        while (itTable.hasNext()) {
                            XWPFTable table = (XWPFTable) itTable.next();
                            int rcount = table.getNumberOfRows();
                            for (int i = 0; i < rcount; i++) {
                                XWPFTableRow row = table.getRow(i);
                                List<XWPFTableCell> cells = row.getTableCells();
                                for (XWPFTableCell cell : cells) {
                                    String cellTextString = cell.getText();
                                    for (Entry<String, String> e : map.entrySet()) {
                                        if (cellTextString.contains(e.getKey()))
                                            cellTextString = cellTextString
                                                    .replace(e.getKey(),
                                                            e.getValue());
                                    }
                                    cell.removeParagraph(0);
                                    cell.setText(cellTextString);
                                }
                            }
                        }
                        FileOutputStream outStream = null;
                        outStream = new FileOutputStream(destPath);
                        document.write(outStream);
                        outStream.close();
                        return true;
                    } catch (Exception e) {
                        e.printStackTrace();
                        return false;
                    }
    
                } else
                // doc只能生成doc,如果生成docx会出错
                if ((sp[sp.length - 1].equalsIgnoreCase("doc"))
                        && (dp[dp.length - 1].equalsIgnoreCase("doc"))) {
                    HWPFDocument document = null;
                    try {
                        document = new HWPFDocument(new FileInputStream(srcPath));
                        Range range = document.getRange();
                        for (Map.Entry<String, String> entry : map.entrySet()) {
                            range.replaceText(entry.getKey(), entry.getValue());
                        }
                        FileOutputStream outStream = null;
                        outStream = new FileOutputStream(destPath);
                        document.write(outStream);
                        outStream.close();
                        return true;
                    } catch (FileNotFoundException e) {
                        e.printStackTrace();
                        return false;
                    } catch (IOException e) {
                        e.printStackTrace();
                        return false;
                    }
                } else {
                    return false;
                }
            } else {
                return false;
            }
        }
    
        public static void main(String[] args) {
            // TODO Auto-generated method stub
            String filepathString = "D:/2.doc";
            String destpathString = "D:/2ttt.doc";
            Map<String, String> map = new HashMap<String, String>();
            map.put("${NAME}", "王五王五啊王力宏的辣味回答侯卫东拉网");
            map.put("${NsAME}", "王五王五啊王力味回答侯卫东拉网");
            map.put("${NAMaE}", "王五王五啊王力宏侯卫东拉网");
            map.put("${NArME}", "王五王五啊王力宏的辣味回答东拉网");
            map.put("${NwAME}", "王五王五啊王的辣味回答侯卫东拉网");
            map.put("${NA4ME}", "王五王五啊王力侯卫东拉网");
            map.put("${N5AME}", "王五王五辣味回答侯卫东拉网");
            map.put("${NAadwME}", "王五力宏的辣味回答侯卫东拉网");
            System.out.println(replaceAndGenerateWord(filepathString,
                    destpathString, map));
        }
    }
  • 相关阅读:
    2016.6.26考试
    爆搜。。。。。。。
    9.18目标
    9.17水题总结
    9.16测试
    9.10考试
    jzoj P1163 生日派对灯
    9.04考试总结
    8/8刷题记录
    a[i++]
  • 原文地址:https://www.cnblogs.com/hold/p/2959452.html
Copyright © 2011-2022 走看看