소스 검색

更新化学试题,测试table识别

zengxj 5 년 전
부모
커밋
1e1063a8cb
3개의 변경된 파일 34개의 추가작업 그리고 0개의 파일을 삭제
  1. BIN
      doc/table.docx
  2. BIN
      doc/化学中考专项诊断.docx
  3. 34 0
      src/test/java/com/yaoxiang/diagnosis/service/WordTest.java

BIN
doc/table.docx


BIN
doc/化学中考专项诊断.docx


+ 34 - 0
src/test/java/com/yaoxiang/diagnosis/service/WordTest.java

@@ -0,0 +1,34 @@
+package com.yaoxiang.diagnosis.service;
+
+import com.yaoxiang.diagnosis.word.WordUtil;
+import org.apache.poi.xwpf.usermodel.XWPFDocument;
+import org.apache.poi.xwpf.usermodel.XWPFParagraph;
+import org.junit.Test;
+import org.springframework.util.FileCopyUtils;
+
+import java.io.ByteArrayOutputStream;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.InputStream;
+import java.util.List;
+
+/** Manual inspection test: loads doc/table.docx and dumps its paragraphs to stdout. */
+public class WordTest {
+    /**
+     * Prints the XML text, immutability flag and string form of each paragraph
+     * returned by {@code getParagraphs()}; it makes no assertions.
+     * @throws Exception if the sample file cannot be read or opened
+     */
+    @Test
+    public void test() throws Exception {
+        byte[] data = FileCopyUtils.copyToByteArray(new File("doc/table.docx"));
+        // XWPFDocument is Closeable: close it once every paragraph has been printed.
+        try (XWPFDocument document = WordUtil.open(data)) {
+            for (XWPFParagraph paragraph : document.getParagraphs()) {
+                System.out.println(paragraph.getCTP().xmlText());
+                System.out.println(paragraph.getCTP().isImmutable());
+                System.out.println(paragraph.toString());
+            }
+        }
+    }
+}