/**
 * Begins processing of a new key.
 *
 * <p>Delegates to the superclass first, then replaces {@code filter} with a
 * freshly constructed {@link DynamicBloomFilter}; whatever filter instance
 * was previously referenced by this object is dropped.
 *
 * @param key the key being started; forwarded unchanged to {@code super.start}
 */
public void start(EmitKey key) {
    super.start(key);

    // TODO: once Hadoop's bloom filter offers a way to be cleared, reuse a
    // single instance here rather than allocating a new filter for every key.
    filter = new DynamicBloomFilter(
            vectorSize,
            DistinctAggregator.HASH_COUNT,
            Hash.MURMUR_HASH,
            // NOTE(review): presumably the filter's per-row key threshold ("nr"
            // in Hadoop's constructor) -- confirm; the value is cast to int.
            (int) getArg());
}