/*
 * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
 * and other copyright owners as documented in the project's IP log.
 *
 * This program and the accompanying materials are made available
 * under the terms of the Eclipse Distribution License v1.0 which
 * accompanies this distribution, is reproduced below, and is
 * available at http://www.eclipse.org/org/documents/edl-v10.php
 *
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or
 * without modification, are permitted provided that the following
 * conditions are met:
 *
 * - Redistributions of source code must retain the above copyright
 *   notice, this list of conditions and the following disclaimer.
 *
 * - Redistributions in binary form must reproduce the above
 *   copyright notice, this list of conditions and the following
 *   disclaimer in the documentation and/or other materials provided
 *   with the distribution.
 *
 * - Neither the name of the Eclipse Foundation, Inc. nor the
 *   names of its contributors may be used to endorse or promote
 *   products derived from this software without specific prior
 *   written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
 * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
 * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

package org.eclipse.jgit.internal.storage.file;

import java.io.IOException;
import java.io.InputStream;
import java.text.MessageFormat;
import java.util.Arrays;
import java.util.Iterator;
import java.util.NoSuchElementException;
import java.util.Set;

import org.eclipse.jgit.errors.MissingObjectException;
import org.eclipse.jgit.internal.JGitText;
import org.eclipse.jgit.lib.AbbreviatedObjectId;
import org.eclipse.jgit.lib.AnyObjectId;
import org.eclipse.jgit.lib.Constants;
import org.eclipse.jgit.lib.ObjectId;
import org.eclipse.jgit.util.IO;
import org.eclipse.jgit.util.NB;

Support for the pack index v2 format.
/** Support for the pack index v2 format. */
class PackIndexV2 extends PackIndex { private static final long IS_O64 = 1L << 31; private static final int FANOUT = 256; private static final int[] NO_INTS = {}; private static final byte[] NO_BYTES = {}; private long objectCnt; private final long[] fanoutTable;
256 arrays of contiguous object names.
/** 256 arrays of contiguous object names. */
int[][] names;
256 arrays of the 32 bit offset data, matching names.
/** 256 arrays of the 32 bit offset data, matching {@link #names}. */
byte[][] offset32;
256 arrays of the CRC-32 of objects, matching names.
/** 256 arrays of the CRC-32 of objects, matching {@link #names}. */
private byte[][] crc32;
64 bit offset table.
/** 64 bit offset table. */
byte[] offset64; PackIndexV2(final InputStream fd) throws IOException { final byte[] fanoutRaw = new byte[4 * FANOUT]; IO.readFully(fd, fanoutRaw, 0, fanoutRaw.length); fanoutTable = new long[FANOUT]; for (int k = 0; k < FANOUT; k++) fanoutTable[k] = NB.decodeUInt32(fanoutRaw, k * 4); objectCnt = fanoutTable[FANOUT - 1]; names = new int[FANOUT][]; offset32 = new byte[FANOUT][]; crc32 = new byte[FANOUT][]; // Object name table. The size we can permit per fan-out bucket // is limited to Java's 2 GB per byte array limitation. That is // no more than 107,374,182 objects per fan-out. // for (int k = 0; k < FANOUT; k++) { final long bucketCnt; if (k == 0) bucketCnt = fanoutTable[k]; else bucketCnt = fanoutTable[k] - fanoutTable[k - 1]; if (bucketCnt == 0) { names[k] = NO_INTS; offset32[k] = NO_BYTES; crc32[k] = NO_BYTES; continue; } else if (bucketCnt < 0) throw new IOException(MessageFormat.format( JGitText.get().indexFileCorruptedNegativeBucketCount, Long.valueOf(bucketCnt))); final long nameLen = bucketCnt * Constants.OBJECT_ID_LENGTH; if (nameLen > Integer.MAX_VALUE - 8) // see http://stackoverflow.com/a/8381338 throw new IOException(JGitText.get().indexFileIsTooLargeForJgit); final int intNameLen = (int) nameLen; final byte[] raw = new byte[intNameLen]; final int[] bin = new int[intNameLen >>> 2]; IO.readFully(fd, raw, 0, raw.length); for (int i = 0; i < bin.length; i++) bin[i] = NB.decodeInt32(raw, i << 2); names[k] = bin; offset32[k] = new byte[(int) (bucketCnt * 4)]; crc32[k] = new byte[(int) (bucketCnt * 4)]; } // CRC32 table. for (int k = 0; k < FANOUT; k++) IO.readFully(fd, crc32[k], 0, crc32[k].length); // 32 bit offset table. Any entries with the most significant bit // set require a 64 bit offset entry in another table. // int o64cnt = 0; for (int k = 0; k < FANOUT; k++) { final byte[] ofs = offset32[k]; IO.readFully(fd, ofs, 0, ofs.length); for (int p = 0; p < ofs.length; p += 4) if (ofs[p] < 0) o64cnt++; } // 64 bit offset table. Most objects should not require an entry. // if (o64cnt > 0) { offset64 = new byte[o64cnt * 8]; IO.readFully(fd, offset64, 0, offset64.length); } else { offset64 = NO_BYTES; } packChecksum = new byte[20]; IO.readFully(fd, packChecksum, 0, packChecksum.length); }
{@inheritDoc}
/** {@inheritDoc} */
@Override public long getObjectCount() { return objectCnt; }
{@inheritDoc}
/** {@inheritDoc} */
@Override public long getOffset64Count() { return offset64.length / 8; } private int findLevelOne(long nthPosition) { int levelOne = Arrays.binarySearch(fanoutTable, nthPosition + 1); if (levelOne >= 0) { // If we hit the bucket exactly the item is in the bucket, or // any bucket before it which has the same object count. // long base = fanoutTable[levelOne]; while (levelOne > 0 && base == fanoutTable[levelOne - 1]) levelOne--; } else { // The item is in the bucket we would insert it into. // levelOne = -(levelOne + 1); } return levelOne; } private int getLevelTwo(long nthPosition, int levelOne) { final long base = levelOne > 0 ? fanoutTable[levelOne - 1] : 0; return (int) (nthPosition - base); }
{@inheritDoc}
/** {@inheritDoc} */
@Override public ObjectId getObjectId(long nthPosition) { final int levelOne = findLevelOne(nthPosition); final int p = getLevelTwo(nthPosition, levelOne); final int p4 = p << 2; return ObjectId.fromRaw(names[levelOne], p4 + p); // p * 5 }
{@inheritDoc}
/** {@inheritDoc} */
@Override public long getOffset(long nthPosition) { final int levelOne = findLevelOne(nthPosition); final int levelTwo = getLevelTwo(nthPosition, levelOne); return getOffset(levelOne, levelTwo); }
{@inheritDoc}
/** {@inheritDoc} */
@Override public long findOffset(AnyObjectId objId) { final int levelOne = objId.getFirstByte(); final int levelTwo = binarySearchLevelTwo(objId, levelOne); if (levelTwo == -1) return -1; return getOffset(levelOne, levelTwo); } private long getOffset(int levelOne, int levelTwo) { final long p = NB.decodeUInt32(offset32[levelOne], levelTwo << 2); if ((p & IS_O64) != 0) return NB.decodeUInt64(offset64, (8 * (int) (p & ~IS_O64))); return p; }
{@inheritDoc}
/** {@inheritDoc} */
@Override public long findCRC32(AnyObjectId objId) throws MissingObjectException { final int levelOne = objId.getFirstByte(); final int levelTwo = binarySearchLevelTwo(objId, levelOne); if (levelTwo == -1) throw new MissingObjectException(objId.copy(), "unknown"); //$NON-NLS-1$ return NB.decodeUInt32(crc32[levelOne], levelTwo << 2); }
{@inheritDoc}
/** {@inheritDoc} */
@Override public boolean hasCRC32Support() { return true; }
{@inheritDoc}
/** {@inheritDoc} */
@Override public Iterator<MutableEntry> iterator() { return new EntriesIteratorV2(); }
{@inheritDoc}
/** {@inheritDoc} */
@Override public void resolve(Set<ObjectId> matches, AbbreviatedObjectId id, int matchLimit) throws IOException { int[] data = names[id.getFirstByte()]; int max = offset32[id.getFirstByte()].length >>> 2; int high = max; if (high == 0) return; int low = 0; do { int p = (low + high) >>> 1; final int cmp = id.prefixCompare(data, idOffset(p)); if (cmp < 0) high = p; else if (cmp == 0) { // We may have landed in the middle of the matches. Move // backwards to the start of matches, then walk forwards. // while (0 < p && id.prefixCompare(data, idOffset(p - 1)) == 0) p--; for (; p < max && id.prefixCompare(data, idOffset(p)) == 0; p++) { matches.add(ObjectId.fromRaw(data, idOffset(p))); if (matches.size() > matchLimit) break; } return; } else low = p + 1; } while (low < high); } private static int idOffset(int p) { return (p << 2) + p; // p * 5 } private int binarySearchLevelTwo(AnyObjectId objId, int levelOne) { final int[] data = names[levelOne]; int high = offset32[levelOne].length >>> 2; if (high == 0) return -1; int low = 0; do { final int mid = (low + high) >>> 1; final int mid4 = mid << 2; final int cmp; cmp = objId.compareTo(data, mid4 + mid); // mid * 5 if (cmp < 0) high = mid; else if (cmp == 0) { return mid; } else low = mid + 1; } while (low < high); return -1; } private class EntriesIteratorV2 extends EntriesIterator { int levelOne; int levelTwo; @Override protected MutableEntry initEntry() { return new MutableEntry() { @Override protected void ensureId() { idBuffer.fromRaw(names[levelOne], levelTwo - Constants.OBJECT_ID_LENGTH / 4); } }; } @Override public MutableEntry next() { for (; levelOne < names.length; levelOne++) { if (levelTwo < names[levelOne].length) { int idx = levelTwo / (Constants.OBJECT_ID_LENGTH / 4) * 4; long offset = NB.decodeUInt32(offset32[levelOne], idx); if ((offset & IS_O64) != 0) { idx = (8 * (int) (offset & ~IS_O64)); offset = NB.decodeUInt64(offset64, idx); } entry.offset = offset; levelTwo += Constants.OBJECT_ID_LENGTH / 4; returnedNumber++; return entry; } levelTwo = 0; } throw new NoSuchElementException(); } } }