public void configure(JobConf job) {
curTime = job.getLong(CRAWL_GEN_CUR_TIME, System.currentTimeMillis());
limit = job.getLong(CRAWL_TOP_N,Long.MAX_VALUE)/job.getNumReduceTasks();
maxPerHost = job.getInt(GENERATE_MAX_PER_HOST, -1);
byIP = job.getBoolean(GENERATE_MAX_PER_HOST_BY_IP, false);
filters = new URLFilters(job);
normalizers = new URLNormalizers(job, URLNormalizers.SCOPE_GENERATE_HOST_COUNT);
scfilters = new ScoringFilters(job);
hostPartitioner.configure(job);
filter = job.getBoolean(CRAWL_GENERATE_FILTER, true);
genDelay = job.getLong(CRAWL_GEN_DELAY, 7L) * 3600L * 24L * 1000L;