一般文本文件
我们以日志文件(.log 文件)为例:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
|
import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;

/**
 * Demo that prints a plain-text log file line by line and then reports its
 * size in whole megabytes.
 */
public class File_Test {

    /**
     * Reports whether the log file exists; when it does, echoes every line to
     * standard output followed by the file size.
     *
     * @param args command-line arguments (unused)
     */
    public static void main(String[] args) {
        File file = new File("D:\\logserrorMsg.log");
        if (!file.exists()) {
            System.out.println("此文件不存在");
            // Nothing to read, so do not attempt to open the file.
            return;
        }
        System.out.println("此文件存在");

        // try-with-resources closes the reader (and the FileReader it wraps)
        // even when reading fails part-way through.
        try (BufferedReader br = new BufferedReader(new FileReader(file))) {
            String s;
            while ((s = br.readLine()) != null) {
                System.out.println(s);
            }
            // File.length() is the actual size in bytes. InputStream.available()
            // is only an estimate of readable bytes, is capped at
            // Integer.MAX_VALUE, and needed an extra stream that was never closed.
            System.out.println("文件大小为(MB):" + file.length() / 1024 / 1024 + "M");
        } catch (FileNotFoundException e) {
            // The path exists but cannot be opened for reading (e.g. a directory).
            e.printStackTrace();
        } catch (IOException e) {
            e.printStackTrace();
        }
    }
}
.doc文件
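这里我们使用WordExtractor读取Word文档,WordExtractor来自于Apache的poi类库项目,官方下载地址:https://poi.apache.org/download.html (注意:下面示例代码导入的是 org.textmining.text.extraction.WordExtractor,该类由基于 POI 的 tm-extractors 库提供;POI 自带的对应类是 org.apache.poi.hwpf.extractor.WordExtractor,两者的 API 并不相同。)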
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
|
import java.io.FileInputStream; import org.textmining.text.extraction.WordExtractor; public class WordTest { public static void main(String args[]) throws Exception { new WordTest().readByOther(); } public void readByText() throws Exception { FileInputStream in = new FileInputStream( "C://test.doc " ); WordExtractor extractor = new WordExtractor(); String str = extractor.extractText(in); System.out.println(str); } } |