Package org.eclipse.jgit.internal.storage.file

Source Code of org.eclipse.jgit.internal.storage.file.PackReverseIndex

/*
* Copyright (C) 2008, Marek Zawirski <marek.zawirski@gmail.com>
* and other copyright owners as documented in the project's IP log.
*
* This program and the accompanying materials are made available
* under the terms of the Eclipse Distribution License v1.0 which
* accompanies this distribution, is reproduced below, and is
* available at http://www.eclipse.org/org/documents/edl-v10.php
*
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or
* without modification, are permitted provided that the following
* conditions are met:
*
* - Redistributions of source code must retain the above copyright
*   notice, this list of conditions and the following disclaimer.
*
* - Redistributions in binary form must reproduce the above
*   copyright notice, this list of conditions and the following
*   disclaimer in the documentation and/or other materials provided
*   with the distribution.
*
* - Neither the name of the Eclipse Foundation, Inc. nor the
*   names of its contributors may be used to endorse or promote
*   products derived from this software without specific prior
*   written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/

package org.eclipse.jgit.internal.storage.file;

import java.text.MessageFormat;

import org.eclipse.jgit.errors.CorruptObjectException;
import org.eclipse.jgit.internal.JGitText;
import org.eclipse.jgit.internal.storage.file.PackIndex.MutableEntry;
import org.eclipse.jgit.lib.ObjectId;

/**
* <p>
* Reverse index for forward pack index. Provides operations based on offset
* instead of object id. Such offset-based reverse lookups are performed in
* O(log n) time.
* </p>
*
* @see PackIndex
* @see PackFile
*/
public class PackReverseIndex {
  /** Index we were created from, and that has our ObjectId data. */
  private final PackIndex index;

  /** The number of bytes per entry in the offsetIndex. */
  private final long bucketSize;

  /**
   * An index into the nth mapping, where the value is the position after the
   * the last index that contains the values of the bucket. For example given
   * offset o (and bucket = o / bucketSize), the offset will be contained in
   * the range nth[offsetIndex[bucket - 1]] inclusive to
   * nth[offsetIndex[bucket]] exclusive.
   *
   * See {@link #binarySearch}
   */
  private final int[] offsetIndex;

  /** Mapping from indices in offset order to indices in SHA-1 order. */
  private final int[] nth;

  /**
   * Create reverse index from straight/forward pack index, by indexing all
   * its entries.
   *
   * @param packIndex
   *            forward index - entries to (reverse) index.
   */
  public PackReverseIndex(final PackIndex packIndex) {
    index = packIndex;

    final long cnt = index.getObjectCount();
    if (cnt + 1 > Integer.MAX_VALUE)
      throw new IllegalArgumentException(
          JGitText.get().hugeIndexesAreNotSupportedByJgitYet);

    if (cnt == 0) {
      bucketSize = Long.MAX_VALUE;
      offsetIndex = new int[1];
      nth = new int[0];
      return;
    }

    final long[] offsetsBySha1 = new long[(int) cnt];

    long maxOffset = 0;
    int ith = 0;
    for (final MutableEntry me : index) {
      final long o = me.getOffset();
      offsetsBySha1[ith++] = o;
      if (o > maxOffset)
        maxOffset = o;
    }

    bucketSize = maxOffset / cnt + 1;
    int[] bucketIndex = new int[(int) cnt];
    int[] bucketValues = new int[(int) cnt + 1];
    for (int oi = 0; oi < offsetsBySha1.length; oi++) {
      final long o = offsetsBySha1[oi];
      final int bucket = (int) (o / bucketSize);
      final int bucketValuesPos = oi + 1;
      final int current = bucketIndex[bucket];
      bucketIndex[bucket] = bucketValuesPos;
      bucketValues[bucketValuesPos] = current;
    }

    int nthByOffset = 0;
    nth = new int[offsetsBySha1.length];
    offsetIndex = bucketIndex; // Reuse the allocation
    for (int bi = 0; bi < bucketIndex.length; bi++) {
      final int start = nthByOffset;
      // Insertion sort of the values in the bucket.
      for (int vi = bucketIndex[bi]; vi > 0; vi = bucketValues[vi]) {
        final int nthBySha1 = vi - 1;
        final long o = offsetsBySha1[nthBySha1];
        int insertion = nthByOffset++;
        for (; start < insertion; insertion--) {
          if (o > offsetsBySha1[nth[insertion - 1]])
            break;
          nth[insertion] = nth[insertion - 1];
        }
        nth[insertion] = nthBySha1;
      }
      offsetIndex[bi] = nthByOffset;
    }
  }

  /**
   * Search for object id with the specified start offset in this pack
   * (reverse) index.
   *
   * @param offset
   *            start offset of object to find.
   * @return object id for this offset, or null if no object was found.
   */
  public ObjectId findObject(final long offset) {
    final int ith = binarySearch(offset);
    if (ith < 0)
      return null;
    return index.getObjectId(nth[ith]);
  }

  /**
   * Search for the next offset to the specified offset in this pack (reverse)
   * index.
   *
   * @param offset
   *            start offset of previous object (must be valid-existing
   *            offset).
   * @param maxOffset
   *            maximum offset in a pack (returned when there is no next
   *            offset).
   * @return offset of the next object in a pack or maxOffset if provided
   *         offset was the last one.
   * @throws CorruptObjectException
   *             when there is no object with the provided offset.
   */
  public long findNextOffset(final long offset, final long maxOffset)
      throws CorruptObjectException {
    final int ith = binarySearch(offset);
    if (ith < 0)
      throw new CorruptObjectException(
          MessageFormat.format(
              JGitText.get().cantFindObjectInReversePackIndexForTheSpecifiedOffset,
              Long.valueOf(offset)));

    if (ith + 1 == nth.length)
      return maxOffset;
    return index.getOffset(nth[ith + 1]);
  }

  int findPostion(long offset) {
    return binarySearch(offset);
  }

  private int binarySearch(final long offset) {
    int bucket = (int) (offset / bucketSize);
    int low = bucket == 0 ? 0 : offsetIndex[bucket - 1];
    int high = offsetIndex[bucket];
    while (low < high) {
      final int mid = (low + high) >>> 1;
      final long o = index.getOffset(nth[mid]);
      if (offset < o)
        high = mid;
      else if (offset == o)
        return mid;
      else
        low = mid + 1;
    }
    return -1;
  }

  ObjectId findObjectByPosition(int nthPosition) {
    return index.getObjectId(nth[nthPosition]);
  }
}
TOP

Related Classes of org.eclipse.jgit.internal.storage.file.PackReverseIndex

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.