public Document readDocument(String lang1, String lang2, File file) throws IOException {
Document document = new Document();
FileReader in = new FileReader(file);
try {
Html2Text parser = new Html2Text();
parser.parse(in);
String text = parser.getText();
if (text != null) {
int size = text.length();
String[] lines = text.split("\n");