读取PDF文件jar引用
1
2
3
4
5
|
<dependency> <groupid>org.apache.pdfbox</groupid> pdfbox</artifactid> <version> 1.8 . 13 </version> </dependency> |
读取WORD文件jar引用
1
2
3
4
5
6
7
8
9
10
|
<dependency> <groupid>org.apache.poi</groupid> poi-scratchpad</artifactid> <version> 3.16 -beta1</version> </dependency> <dependency> <groupid>org.apache.poi</groupid> poi</artifactid> <version> 3.16 -beta1</version> </dependency> |
读取WORD文件方法
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
|
/** * * @Title: getTextFromWord * @Description: 读取word * @param filePath * 文件路径 * @return: String 读出的Word的内容 */ public static String getTextFromWord(String filePath) { String result = null ; File file = new File(filePath); FileInputStream fis = null ; try { fis = new FileInputStream(file); @SuppressWarnings ( "resource" ) WordExtractor wordExtractor = new WordExtractor(fis); result = wordExtractor.getText(); } catch (FileNotFoundException e) { e.printStackTrace(); } catch (IOException e) { e.printStackTrace(); } finally { if (fis != null ) { try { fis.close(); } catch (IOException e) { e.printStackTrace(); } } } return result; } |
读取PDF文件方法
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
|
/** * * @Title: getTextFromPdf * @Description: 读取pdf文件内容 * @param filePath * @return: 读出的pdf的内容 */ public static String getTextFromPdf(String filePath) { String result = null ; FileInputStream is = null ; PDDocument document = null ; try { is = new FileInputStream(filePath); PDFParser parser = new PDFParser(is); parser.parse(); document = parser.getPDDocument(); PDFTextStripper stripper = new PDFTextStripper(); result = stripper.getText(document); } catch (FileNotFoundException e) { e.printStackTrace(); } catch (IOException e) { e.printStackTrace(); } finally { if (is != null ) { try { is.close(); } catch (IOException e) { e.printStackTrace(); } } if (document != null ) { try { document.close(); } catch (IOException e) { e.printStackTrace(); } } } return result; } |
希望本篇实例代码可以帮到您
原文链接:http://www.2cto.com/kf/201701/584974.html