Java 读取 Word 文档(.doc / .docx)

helei 2020-5-21 894 5/21
Maven 引入依赖:
<dependency>
				<groupId>org.apache.poi</groupId>
				<artifactId>poi-ooxml</artifactId>
				<version>3.8</version>
		</dependency>
		 
		<dependency>
				<groupId>org.apache.poi</groupId>
				<artifactId>poi-scratchpad</artifactId>
				<version>3.8</version>
		</dependency>
/**
 * Reads the plain text of a Word document.
 *
 * <p>Paths ending in {@code .doc} are read through {@code WordExtractor};
 * paths ending in {@code .docx} are read through {@code XWPFWordExtractor}.
 * The extension is matched case-insensitively. For any other path a message
 * is printed to standard output and nothing is read.
 *
 * <p>Every exception raised while reading (including the one caused by a
 * {@code null} path) is caught, its stack trace is printed, and the method
 * still returns normally.
 *
 * @param path file-system path of the document to read
 * @return the extracted text, or an empty string when the path is not a Word
 *         file or reading failed
 */
public static String readWord(String path) {
	String buffer = "";
	try {
		// Fully qualified so the method does not need an extra import.
		String lowerPath = path.toLowerCase(java.util.Locale.ROOT);
		if (lowerPath.endsWith(".doc")) {
			FileInputStream is = new FileInputStream(path);
			try {
				WordExtractor ex = new WordExtractor(is);
				buffer = ex.getText();
			} finally {
				// Release the file handle even when extraction throws.
				is.close();
			}
		} else if (lowerPath.endsWith(".docx")) {
			OPCPackage opcPackage = POIXMLDocument.openPackage(path);
			try {
				POIXMLTextExtractor extractor = new XWPFWordExtractor(opcPackage);
				buffer = extractor.getText();
			} finally {
				// Release the package even when extraction throws.
				opcPackage.close();
			}
		} else {
			System.out.println("此文件不是word文件!");
		}
	} catch (Exception e) {
		e.printStackTrace();
	}
	return buffer;
}
- THE END -

helei

5月21日15:24

最后修改:2020年5月21日
0

非特殊说明,本博所有文章均为博主原创。