getRawTextFromUrlIfNeeded(doc, feedConfig);
// (if transforming full text then grab the raw body from the URL if necessary)
cachedFullText = doc.getFullText();
}//TESTED (by hand)
}
SimpleTextCleanserPojo mappedTextExtractor = new SimpleTextCleanserPojo();
mappedTextExtractor.setField(textExtractor.fieldName);
mappedTextExtractor.setFlags(textExtractor.flags);
mappedTextExtractor.setScript(textExtractor.script);
mappedTextExtractor.setScriptlang(textExtractor.scriptlang);
mappedTextExtractor.setReplacement(textExtractor.replacement);
mappedTextExtractors.add(mappedTextExtractor);
}
this.cleanseText(mappedTextExtractors, doc);
return cachedFullText;