// At this point outputFile holds plain text; load it as a list of lines.
// NOTE(review): no charset is passed to readLines - confirm the default
// matches the encoding outputFile was written with.
List<String> lines = FileUtils.readLines(outputFile);

// Starts out empty; nothing in this section fills it.
Map<String,Double> idfValues = new HashMap<String,Double>();

// The measure is handed its own fresh, empty map (not idfValues); here it is
// only used to split each text into its n-grams.
CharacterNGramMeasure measure = new CharacterNGramMeasure(n, new HashMap<String, Double>());

// Treat every line as one text: docs receives one n-gram set per line,
// in the same order as lines.
List<Set<String>> docs = new ArrayList<Set<String>>();
for (String text : lines)
{
    docs.add(measure.getNGrams(text));
}
// Get all ngrams