/* * CDDL HEADER START * * The contents of this file are subject to the terms of the * Common Development and Distribution License, Version 1.0 only * (the "License"). You may not use this file except in compliance * with the License. * * You can obtain a copy of the license at legal-notices/CDDLv1_0.txt * or http://forgerock.org/license/CDDLv1.0.html. * See the License for the specific language governing permissions * and limitations under the License. * * When distributing Covered Code, include this CDDL HEADER in each * file and include the License file at legal-notices/CDDLv1_0.txt. * If applicable, add the following below this CDDL HEADER, with the * fields enclosed by brackets "[]" replaced with your own identifying * information: * Portions Copyright [yyyy] [name of copyright owner] * * CDDL HEADER END * * * Copyright 2009-2010 Sun Microsystems, Inc. * Portions Copyright 2013-2015 ForgeRock AS. */ package org.opends.server.backends.pluggable; import static org.opends.server.backends.pluggable.Importer.indexComparator; import java.io.ByteArrayOutputStream; import java.io.DataOutputStream; import java.io.IOException; import org.forgerock.opendj.ldap.ByteSequence; import org.forgerock.opendj.ldap.ByteStringBuilder; /** * This class represents a index buffer used to store the keys and entry IDs * processed from the LDIF file during phase one of an import, or rebuild index * process. Each key and ID is stored in a record in the buffer. *

* The records in the buffer are eventually sorted, based on the key, when the * maximum size of the buffer is reached and no more records will fit into the * buffer. The buffer is scheduled to be flushed to an index scratch file and * then re-cycled by the import, or rebuild-index process. *

* The structure of a record in the buffer is the following: * *

 * +-------------+-------------+---------+---------+------------+-----------+
 * | record size | INS/DEL bit | indexID | entryID | key length | key bytes |
 * +-------------+-------------+---------+---------+------------+-----------+
 *

* * The record size is used for fast seeks to quickly "jump" over records. *

* The records are packed as much as possible, to optimize the buffer space. *

* This class is not thread safe. *

*/ final class IndexOutputBuffer implements Comparable { /** The number of bytes of a Java int. */ static final int INT_SIZE = 4; /** The number of bytes of a Java long. */ static final int LONG_SIZE = 8; /** * The record overhead. In addition to entryID, key length and key bytes, the * record overhead includes the INS/DEL bit + indexID */ private static final int REC_OVERHEAD = 1 + INT_SIZE; /** Buffer records are either insert records or delete records. */ private static final byte DEL = 0, INS = 1; /** The size of a buffer. */ private final int size; /** Byte array holding the actual buffer data. */ private final byte buffer[]; /** * Used to break a tie (keys equal) when the buffers are being merged * for writing to the index scratch file. */ private long bufferID; /** OffSet where next key is written. */ private int keyOffset; /** OffSet where next value record is written. */ private int recordOffset; /** Amount of bytes left in the buffer. */ private int bytesLeft; /** Number of keys in the buffer. */ private int keys; /** Used to iterate over the buffer when writing to a scratch file. */ private int position; /** * Used to make sure that an instance of this class is put on the * correct scratch file writer work queue for processing. */ private Importer.IndexKey indexKey; /** Initial capacity of re-usable buffer used in key compares. */ private static final int CAP = 32; /** * This buffer is reused during key compares. It's main purpose is to keep * memory footprint as small as possible. */ private ByteStringBuilder keyBuffer = new ByteStringBuilder(CAP); /** * Set to {@code true} if the buffer should not be recycled. Used when the * importer/rebuild index process is doing phase one cleanup and flushing * buffers not completed. */ private boolean discarded; /** * Create an instance of a IndexBuffer using the specified size. * * @param size The size of the underlying byte array. */ public IndexOutputBuffer(int size) { this.size = size; this.buffer = new byte[size]; this.bytesLeft = size; this.recordOffset = size - 1; } /** * Reset an IndexBuffer so it can be re-cycled. */ public void reset() { bytesLeft = size; keyOffset = 0; recordOffset = size - 1; keys = 0; position = 0; indexKey = null; } /** * Creates a new poison buffer. Poison buffers are used to stop the processing of import tasks. * * @return a new poison buffer */ public static IndexOutputBuffer poison() { return new IndexOutputBuffer(0); } /** * Set the ID of a buffer to the specified value. * * @param bufferID The value to set the buffer ID to. */ public void setBufferID(long bufferID) { this.bufferID = bufferID; } /** * Return the ID of a buffer. * * @return The value of a buffer's ID. */ private long getBufferID() { return this.bufferID; } /** * Determines if a buffer is a poison buffer. A poison buffer is used to * shutdown work queues when import/rebuild index phase one is completed. * A poison buffer has a 0 size. * * @return {@code true} if a buffer is a poison buffer, or {@code false} * otherwise. */ public boolean isPoison() { return size == 0; } /** * Determines if buffer should be re-cycled by calling {@link #reset()}. * * @return {@code true} if buffer should be recycled, or {@code false} if it should not. */ boolean isDiscarded() { return discarded; } /** * Sets the discarded flag to {@code true}. */ public void discard() { discarded = true; } /** * Returns {@code true} if there is enough space available to write the * specified byte array in the buffer. It returns {@code false} otherwise. * * @param kBytes The byte array to check space against. * @param entryID The entryID value to check space against. * @return {@code true} if there is space to write the byte array in a * buffer, or {@code false} otherwise. */ public boolean isSpaceAvailable(ByteSequence kBytes, long entryID) { return getRequiredSize(kBytes.length(), entryID) < bytesLeft; } /** * Return a buffer's current position value. * * @return The buffer's current position value. */ public int getPosition() { return position; } /** * Set a buffer's position value to the specified position. * * @param position The value to set the position to. */ public void setPosition(int position) { this.position = position; } /** * Sort the buffer. */ public void sort() { sort(0, keys); } /** * Add the specified key byte array and EntryID to the buffer. * * @param keyBytes The key byte array. * @param entryID The EntryID. * @param indexID The index ID the record belongs. * @param insert True if key is an insert, false otherwise. */ public void add(ByteSequence keyBytes, EntryID entryID, int indexID, boolean insert) { // write the record data, but leave the space to write the record size just // before it recordOffset = addRecord(keyBytes, entryID.longValue(), indexID, insert); // then write the returned record size keyOffset = writeInt(buffer, keyOffset, recordOffset); bytesLeft = recordOffset - keyOffset; keys++; } /** * Writes the full record minus the record size itself. */ private int addRecord(ByteSequence key, long entryID, int indexID, boolean insert) { int retOffset = recordOffset - getRecordSize(key.length()); int offSet = retOffset; // write the INS/DEL bit buffer[offSet++] = insert ? INS : DEL; // write the indexID offSet = writeInt(buffer, offSet, indexID); // write the entryID offSet = writeLong(buffer, offSet, entryID); // write the key length offSet = writeInt(buffer, offSet, key.length()); // write the key bytes key.copyTo(buffer, offSet); return retOffset; } /** * Computes the full size of the record. * * @param keyLen The length of the key of index * @param entryID The entry id * @return The size that such record would take in the IndexOutputBuffer */ public static int getRequiredSize(int keyLen, long entryID) { // also add up the space needed to store the record size return getRecordSize(keyLen) + INT_SIZE; } private static int getRecordSize(int keyLen) { // Adds up (INS/DEL bit + indexID) + entryID + key length + key bytes return REC_OVERHEAD + LONG_SIZE + INT_SIZE + keyLen; } /** * Write the entryID at the specified position to the specified output stream. * Used when writing the index scratch files. * * @param stream The stream to write the record at the index to. * @param position The position of the record to write. */ public void writeEntryID(ByteArrayOutputStream stream, int position) { int offSet = getOffset(position); stream.write(buffer, offSet + REC_OVERHEAD, LONG_SIZE); } /** * Return {@code true} if the record specified by the position is an insert * record, or {@code false} if it a delete record. * * @param position The position of the record. * @return {@code true} if the record is an insert record, or {@code false} * if it is a delete record. */ public boolean isInsertRecord(int position) { int recOffset = getOffset(position); return buffer[recOffset] == INS; } /** * Return the size of the key part of the record. * * @return The size of the key part of the record. */ public int getKeySize() { int offSet = getOffset(position) + REC_OVERHEAD + LONG_SIZE; return readInt(buffer, offSet); } /** * Return the key value part of a record indicated by the current buffer * position. * * @return byte array containing the key value. */ public byte[] getKey() { return getKey(position); } /** Used to minimized memory usage when comparing keys. */ private ByteStringBuilder getKeyBuf(int position) { keyBuffer.clear(); int offSet = getOffset(position) + REC_OVERHEAD + LONG_SIZE; int keyLen = readInt(buffer, offSet); offSet += INT_SIZE; keyBuffer.append(buffer, offSet, keyLen); return keyBuffer; } /** * Return the key value part of a record specified by the index. * * @param position position to return. * @return byte array containing the key value. */ private byte[] getKey(int position) { int offSet = getOffset(position) + REC_OVERHEAD + LONG_SIZE; int keyLen = readInt(buffer, offSet); offSet += INT_SIZE; byte[] key = new byte[keyLen]; System.arraycopy(buffer, offSet, key, 0, keyLen); return key; } private int getOffset(int position) { return readInt(position * INT_SIZE); } /** * Return index id associated with the current position's record. * * @return The index id. */ public int getIndexID() { return getIndexID(position); } private int getIndexID(int position) { return getIndexIDFromOffset(getOffset(position)); } private int getIndexIDFromOffset(int offset) { return readInt(offset + 1); } private int compare(int xPosition, int yPosition) { int xoffSet = getOffset(xPosition); int xIndexID = getIndexIDFromOffset(xoffSet); xoffSet += REC_OVERHEAD + LONG_SIZE; int xKeyLen = readInt(buffer, xoffSet); int xKey = INT_SIZE + xoffSet; int yoffSet = getOffset(yPosition); int yIndexID = getIndexIDFromOffset(yoffSet); yoffSet += REC_OVERHEAD + LONG_SIZE; int yKeyLen = readInt(buffer, yoffSet); int yKey = INT_SIZE + yoffSet; return indexComparator.compare(buffer, xKey, xKeyLen, xIndexID, buffer, yKey, yKeyLen, yIndexID); } private int compare(int xPosition, byte[] yKey, int yIndexID) { int xoffSet = getOffset(xPosition); int xIndexID = getIndexIDFromOffset(xoffSet); xoffSet += REC_OVERHEAD + LONG_SIZE; int xKeyLen = readInt(buffer, xoffSet); int xKey = INT_SIZE + xoffSet; return indexComparator.compare(buffer, xKey, xKeyLen, xIndexID, yKey, 0, yKey.length, yIndexID); } /** * Verifies whether the provided byte array and indexID are equal to * the byte array and indexIDs currently pointed to by this index output buffer. * * @param b The byte array to compare. * @param bIndexID The index key to compare. * @return True if the byte arrays are equal. */ public boolean sameKeyAndIndexID(byte[] b, int bIndexID) { if (b == null) { return false; } int offset = getOffset(position); int indexID = getIndexIDFromOffset(offset); offset += REC_OVERHEAD + LONG_SIZE; int keyLen = readInt(buffer, offset); int key = INT_SIZE + offset; return indexComparator.compare(buffer, key, keyLen, b, b.length) == 0 && indexID == bIndexID; } /** * Compare current IndexBuffer to the specified index buffer using both the * comparator and index ID of both buffers. * * The key at the value of position in both buffers are used in the compare. * * @param b The IndexBuffer to compare to. * @return 0 if the buffers are equal, -1 if the current buffer is less * than the specified buffer, or 1 if it is greater. */ @Override public int compareTo(IndexOutputBuffer b) { final ByteStringBuilder keyBuf = b.getKeyBuf(b.position); int offset = getOffset(position); int indexID = getIndexIDFromOffset(offset); offset += REC_OVERHEAD + LONG_SIZE; int keyLen = readInt(buffer, offset); int key = INT_SIZE + offset; int cmp = indexComparator.compare(buffer, key, keyLen, keyBuf.getBackingArray(), keyBuf.length()); if (cmp == 0) { cmp = compareInts(indexID, b.getIndexID()); if (cmp == 0) { // This is tested in a tree set remove when a buffer is removed from the tree set. return compareLongs(bufferID, b.getBufferID()); } } return cmp; } private static int compareLongs(long l1, long l2) { if (l1 == l2) { return 0; } else if (l1 < l2) { return -1; } else { return 1; } } /** * Write a record to specified output stream using the record pointed to by * the current position and the specified byte stream of ids. * * @param dataStream The data output stream to write to. * * @throws IOException If an I/O error occurs writing the record. */ public void writeKey(DataOutputStream dataStream) throws IOException { int offSet = getOffset(position) + REC_OVERHEAD + LONG_SIZE; int keyLen = readInt(buffer, offSet); offSet += INT_SIZE; dataStream.write(buffer, offSet, keyLen); } /** * Compare the byte array at the current position with the byte array at the * provided position. * * @param position The index pointing to the byte array to compare. * @return {@code true} if the byte arrays are equal, or {@code false} otherwise */ public boolean sameKeyAndIndexID(int position) { return compare(position, this.position) == 0; } /** * Return the current number of keys. * * @return The number of keys currently in an index buffer. */ public int getNumberKeys() { return keys; } /** * Return {@code true} if the buffer has more data to process, or * {@code false} otherwise. Used when iterating over the buffer writing the * scratch index file. * * @return {@code true} if a buffer has more data to process, or * {@code false} otherwise. */ public boolean hasMoreData() { return position + 1 < keys; } /** * Advance the position pointer to the next record in the buffer. Used when * iterating over the buffer examining keys. */ public void nextRecord() { position++; } private int writeInt(byte[] buffer, int offset, int val) { final int endOffset = offset + INT_SIZE; for (int i = endOffset - 1; i >= offset; i--) { buffer[i] = (byte) (val & 0xff); val >>>= 8; } return endOffset; } private int writeLong(byte[] buffer, int offset, long val) { final int endOffset = offset + LONG_SIZE; for (int i = endOffset - 1; i >= offset; i--) { buffer[i] = (byte) (val & 0xff); val >>>= 8; } return endOffset; } private int readInt(int index) { return readInt(buffer, index); } private int readInt(byte[] buffer, int index) { int answer = 0; for (int i = 0; i < INT_SIZE; i++) { byte b = buffer[index + i]; answer <<= 8; answer |= (b & 0xff); } return answer; } private int med3(int a, int b, int c) { return compare(a,b) < 0 ? (compare(b,c) < 0 ? b : compare(a,c) < 0 ? c : a) : (compare(b,c) > 0 ? b : compare(a,c) > 0 ? c : a); } private void sort(int off, int len) { if (len < 7) { for (int i=off; ioff && compare(j-1, j)>0; j--) { swap(j, j-1); } } return; } int m = off + (len >> 1); if (len > 7) { int l = off; int n = off + len - 1; if (len > 40) { int s = len/8; l = med3(l, l+s, l+2*s); m = med3(m-s, m, m+s); n = med3(n-2*s, n-s, n); } m = med3(l, m, n); } byte[] mKey = getKey(m); int mIndexID = getIndexID(m); int a = off, b = a, c = off + len - 1, d = c; while(true) { while (b <= c && compare(b, mKey, mIndexID) <= 0) { if (compare(b, mKey, mIndexID) == 0) { swap(a++, b); } b++; } while (c >= b && compare(c, mKey, mIndexID) >= 0) { if (compare(c, mKey, mIndexID) == 0) { swap(c, d--); } c--; } if (b > c) { break; } swap(b++, c--); } // Swap partition elements back to middle int s, n = off + len; s = Math.min(a-off, b-a ); vectorSwap(off, b-s, s); s = Math.min(d-c, n-d-1); vectorSwap(b, n-s, s); s = b - a; // Recursively sort non-partition-elements if (s > 1) { sort(off, s); } s = d - c; if (s > 1) { sort(n-s, s); } } private void swap(int a, int b) { int aOffset = a * INT_SIZE; int bOffset = b * INT_SIZE; int bVal = readInt(bOffset); System.arraycopy(buffer, aOffset, buffer, bOffset, INT_SIZE); writeInt(buffer, aOffset, bVal); } private void vectorSwap(int a, int b, int n) { for (int i=0; i * The Comparator interface cannot be used in this class, so this * special one is used that knows about the special properties of this class. */ public static class IndexComparator { /** * Compare an offset in a byte array and indexID with the specified offset in the other byte array * and other indexID, using the DN compare algorithm. * * @param array1 The first byte array. * @param offset1 The first byte array's offset. * @param length1 The first byte array's length. * @param indexID1 The first index id. * @param array2 The second byte array to compare to. * @param offset1 The second byte array's offset. * @param length2 The second byte array's length. * @param indexID2 The second index id. * @return a negative integer, zero, or a positive integer as the first * offset value is less than, equal to, or greater than the second * byte array. */ private int compare(byte[] array1, int offset1, int length1, int indexID1, byte[] array2, int offset2, int length2, int indexID2) { int cmp = compareArrays(array1, offset1, length1, array2, offset2, length2); if (cmp == 0) { cmp = compareInts(length1, length2); if (cmp == 0) { return compareInts(indexID1, indexID2); } } return cmp; } int compare(ByteStringBuilder key1, ByteStringBuilder key2) { return compare(key1.getBackingArray(), 0, key1.length(), key2.getBackingArray(), key2.length()); } /** * Compare an offset in an byte array with the specified byte array, * using the DN compare algorithm. * * @param b The byte array. * @param offset The first offset. * @param length The first length. * @param other The second byte array to compare to. * @param otherLength The second byte array's length. * @return a negative integer, zero, or a positive integer as the first * offset value is less than, equal to, or greater than the second * byte array. */ int compare(byte[] b, int offset, int length, byte[] other, int otherLength) { int cmp = compareArrays(b, offset, length, other, 0, otherLength); if (cmp == 0) { return compareInts(length, otherLength); } return cmp; } private int compareArrays(byte[] array1, int offset1, int length1, byte[] array2, int offset2, int length2) { for (int i = 0; i < length1 && i < length2; i++) { byte b1 = array1[offset1 + i]; byte b2 = array2[offset2 + i]; if (b1 > b2) { return 1; } else if (b1 < b2) { return -1; } } return 0; } } private static int compareInts(int i1, int i2) { if (i1 == i2) { return 0; } else if (i1 > i2) { return 1; } else { return -1; } } /** * Set the index key associated with an index buffer. * * @param indexKey The index key. */ public void setIndexKey(Importer.IndexKey indexKey) { this.indexKey = indexKey; } /** * Return the index key of an index buffer. * @return The index buffer's index key. */ public Importer.IndexKey getIndexKey() { return indexKey; } }