You can use the Apache POI library to read the content of a DOC file. The following code snippet reads a DOC file using Apache POI:
DocReader.java:
-------------------------------------------------
package in.anyforum;
import java.io.*;
import org.apache.poi.hwpf.HWPFDocument;
import org.apache.poi.hwpf.extractor.WordExtractor;
/**
 * Prints the paragraph text of a legacy Word ({@code .doc}) file to standard output
 * using Apache POI's HWPF {@link WordExtractor}.
 */
public class DocReader
{
    /** Path used when no command-line argument is supplied. */
    private static final String DEFAULT_PATH = "File.doc";

    /**
     * Opens the document, extracts its paragraphs and prints each non-null one.
     *
     * @param args optional; if present, {@code args[0]} is the path of the document to read,
     *             otherwise {@code File.doc} in the working directory is used
     */
    public static void main(String[] args)
    {
        String path = (args != null && args.length > 0) ? args[0] : DEFAULT_PATH;

        // try-with-resources closes the extractor and the input stream (in that order)
        // even when reading fails, so no file handle is leaked.
        try (FileInputStream fis = new FileInputStream(path);
             WordExtractor extractor = new WordExtractor(new HWPFDocument(fis)))
        {
            for (String paragraph : extractor.getParagraphText())
            {
                if (paragraph != null)
                {
                    System.out.println(paragraph);
                }
            }
        }
        catch (Exception exep)
        {
            // main is the outermost boundary: report any failure (missing file,
            // unreadable/unsupported document) instead of propagating it.
            exep.printStackTrace();
        }
    }
}
Click Here to download Apache POI Jar