Package org.fastlsh.hash

Source Code of org.fastlsh.hash.HashFamily

/*
   Copyright 2012 Michael Mastroianni, Amol Kapila (fastlsh.org)
    Licensed under the Apache License, Version 2.0 (the "License");
    you may not use this file except in compliance with the License.
    You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
   limitations under the License.
*/

package org.fastlsh.hash;


import java.io.Serializable;
import java.util.Random;

import org.fastlsh.index.VectorWithId;
import org.fastlsh.util.BitSet;


public class HashFamily implements Serializable
{
  private static final long serialVersionUID = -7319322808317106833L;
 
  HashFunction [] hashes;
    public HashFamily(HashFunction [] hs)
    {
        hashes = hs;
    }
   
    /**
     * Generates the LSH signature corresponding to the input data vector and the family of hash functions.
     * @param input the input vector whose signature is desired
     * @return the LSH signature for the input vector
     */
    public BitSet makeSignature(VectorWithId input)
    {
        BitSet retval = new BitSet(hashes.length);
        for(int i = 0, max = hashes.length; i < max; i++)
        {
            retval.set(i, hashes[i].hash(input));
        }
        return retval;
    }

  /**
   * Makes an LSH family for cosine similarity.
   * @param dimension the dimension of the data vectors to be hashed
   * @param familySize the number of hash functions to include in the family
   * @return an array containing the functions comprising the family
   */
  public static HashFamily getCosineHashFamily(int dimension, int familySize)
  {
      HashFunction [] fns = new HashFunction[familySize];
      Random rand = new Random();
      for (int i = 0; i < familySize; i++) fns[i] = new CosineHash(dimension, rand);
      return new HashFamily(fns);
  }
 
  /**
   * Makes an LSH family for Euclidean (L2) distance.
   * @param dimension the dimension of the data vectors to be hashed
   * @param familySize the number of hash functions to include in the family
   * @return an array containing the functions comprising the family
   */
  public static HashFamily getL2HashFamily(int dimension, int familySize)
  {
      HashFunction [] fns = new HashFunction[familySize];
      Random rand = new Random();
      for (int i = 0; i < familySize; i++) fns[i] = new L2Hash(dimension, rand);
      return new HashFamily(fns);
  }
}
TOP

Related Classes of org.fastlsh.hash.HashFamily

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.