org.apache.flink.util.MathUtils.jenkinsHash java code examples

/**
 * Computes a hash of the given code that depends on the recursion level.
 *
 * <p>The bits of {@code code} are rotated left by {@code 11 * level} positions before being
 * passed to {@code MathUtils.jenkinsHash}. Using the level this way yields a different hash
 * function for each level of recursive partitioning, so that the working set eventually fits
 * into memory.
 *
 * @param code the hash code to scramble
 * @param level the recursion level of the partitioning
 * @return the Jenkins hash of the rotated code
 */
public static int hash(int code, int level) {
  final int rotated = Integer.rotateLeft(code, 11 * level);
  return MathUtils.jenkinsHash(rotated);
}

/**
 * Computes a hash of the given code that depends on the recursion level.
 *
 * <p>The bits of {@code code} are rotated left by {@code 11 * level} positions before being
 * passed to {@code MathUtils.jenkinsHash}. Using the level this way yields a different hash
 * function for each level of recursive partitioning, so that the working set eventually fits
 * into memory.
 *
 * @param code the hash code to scramble
 * @param level the recursion level of the partitioning
 * @return the Jenkins hash of the rotated code
 */
public static int hash(int code, int level) {
  final int rotated = Integer.rotateLeft(code, 11 * level);
  return MathUtils.jenkinsHash(rotated);
}

/**
 * Computes a hash of the given code that depends on the recursion level.
 *
 * <p>The bits of {@code code} are rotated left by {@code 11 * level} positions before being
 * passed to {@code MathUtils.jenkinsHash}. Using the level this way yields a different hash
 * function for each level of recursive partitioning, so that the working set eventually fits
 * into memory.
 *
 * @param code the hash code to scramble
 * @param level the recursion level of the partitioning
 * @return the Jenkins hash of the rotated code
 */
public static int hash(int code, int level) {
  final int rotated = Integer.rotateLeft(code, 11 * level);
  return MathUtils.jenkinsHash(rotated);
}

/**
 * Computes a hash of the given code that depends on the recursion level.
 *
 * <p>The bits of {@code code} are rotated left by {@code 11 * level} positions before being
 * passed to {@code MathUtils.jenkinsHash}. Using the level this way yields a different hash
 * function for each level of recursive partitioning, so that the working set eventually fits
 * into memory.
 *
 * @param code the hash code to scramble
 * @param level the recursion level of the partitioning
 * @return the Jenkins hash of the rotated code
 */
public static int hash(int code, int level) {
  final int rotated = Integer.rotateLeft(code, 11 * level);
  return MathUtils.jenkinsHash(rotated);
}

/**
 * Inserts the given record: the record is handed to the partition referenced by its hash
 * bucket, and a bucket entry carrying the hash code and the returned pointer is added.
 * Returns immediately without doing anything if the table is closed.
 *
 * @param record the record to insert
 * @throws IOException declared by this method; presumably raised by the partition or bucket
 *     helpers it calls (not visible here)
 */
@Override
public final void insert(T record) throws IOException {
  if (this.closed) {
    return;
  }

  // scramble the comparator's hash and reduce it to a bucket index
  final int hash = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
  final int bucketIndex = hash % this.numBuckets;

  // segment containing the bucket, and the bucket's offset within that segment
  final MemorySegment bucketSegment = this.buckets[bucketIndex >>> this.bucketsPerSegmentBits];
  final int offsetInSegment = (bucketIndex & this.bucketsPerSegmentMask) << NUM_INTRA_BUCKET_BITS;

  // the partition number is read from the bucket at HEADER_PARTITION_OFFSET
  final int partitionId = bucketSegment.get(offsetInSegment + HEADER_PARTITION_OFFSET);
  final InMemoryPartition<T> target = this.partitions.get(partitionId);

  final long recordPointer = insertRecordIntoPartition(record, target, false);
  insertBucketEntryFromStart(bucketSegment, offsetInSegment, hash, recordPointer, partitionId);
}

/**
 * Inserts the given record: the record is handed to the partition referenced by its hash
 * bucket, and a bucket entry carrying the hash code and the returned pointer is added.
 * Returns immediately without doing anything if the table is closed.
 *
 * @param record the record to insert
 * @throws IOException declared by this method; presumably raised by the partition or bucket
 *     helpers it calls (not visible here)
 */
@Override
public final void insert(T record) throws IOException {
  if (this.closed) {
    return;
  }

  // scramble the comparator's hash and reduce it to a bucket index
  final int hash = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
  final int bucketIndex = hash % this.numBuckets;

  // segment containing the bucket, and the bucket's offset within that segment
  final MemorySegment bucketSegment = this.buckets[bucketIndex >>> this.bucketsPerSegmentBits];
  final int offsetInSegment = (bucketIndex & this.bucketsPerSegmentMask) << NUM_INTRA_BUCKET_BITS;

  // the partition number is read from the bucket at HEADER_PARTITION_OFFSET
  final int partitionId = bucketSegment.get(offsetInSegment + HEADER_PARTITION_OFFSET);
  final InMemoryPartition<T> target = this.partitions.get(partitionId);

  final long recordPointer = insertRecordIntoPartition(record, target, false);
  insertBucketEntryFromStart(bucketSegment, offsetInSegment, hash, recordPointer, partitionId);
}

/**
 * Inserts the given record: the record is handed to the partition referenced by its hash
 * bucket, and a bucket entry carrying the hash code and the returned pointer is added.
 * Returns immediately without doing anything if the table is closed.
 *
 * @param record the record to insert
 * @throws IOException declared by this method; presumably raised by the partition or bucket
 *     helpers it calls (not visible here)
 */
@Override
public final void insert(T record) throws IOException {
  if (this.closed) {
    return;
  }

  // scramble the comparator's hash and reduce it to a bucket index
  final int hash = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
  final int bucketIndex = hash % this.numBuckets;

  // segment containing the bucket, and the bucket's offset within that segment
  final MemorySegment bucketSegment = this.buckets[bucketIndex >>> this.bucketsPerSegmentBits];
  final int offsetInSegment = (bucketIndex & this.bucketsPerSegmentMask) << NUM_INTRA_BUCKET_BITS;

  // the partition number is read from the bucket at HEADER_PARTITION_OFFSET
  final int partitionId = bucketSegment.get(offsetInSegment + HEADER_PARTITION_OFFSET);
  final InMemoryPartition<T> target = this.partitions.get(partitionId);

  final long recordPointer = insertRecordIntoPartition(record, target, false);
  insertBucketEntryFromStart(bucketSegment, offsetInSegment, hash, recordPointer, partitionId);
}

/**
 * Inserts the given record: the record is handed to the partition referenced by its hash
 * bucket, and a bucket entry carrying the hash code and the returned pointer is added.
 * Returns immediately without doing anything if the table is closed.
 *
 * @param record the record to insert
 * @throws IOException declared by this method; presumably raised by the partition or bucket
 *     helpers it calls (not visible here)
 */
@Override
public final void insert(T record) throws IOException {
  if (this.closed) {
    return;
  }

  // scramble the comparator's hash and reduce it to a bucket index
  final int hash = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
  final int bucketIndex = hash % this.numBuckets;

  // segment containing the bucket, and the bucket's offset within that segment
  final MemorySegment bucketSegment = this.buckets[bucketIndex >>> this.bucketsPerSegmentBits];
  final int offsetInSegment = (bucketIndex & this.bucketsPerSegmentMask) << NUM_INTRA_BUCKET_BITS;

  // the partition number is read from the bucket at HEADER_PARTITION_OFFSET
  final int partitionId = bucketSegment.get(offsetInSegment + HEADER_PARTITION_OFFSET);
  final InMemoryPartition<T> target = this.partitions.get(partitionId);

  final long recordPointer = insertRecordIntoPartition(record, target, false);
  insertBucketEntryFromStart(bucketSegment, offsetInSegment, hash, recordPointer, partitionId);
}

/**
 * Adds the given record to the hash table. Returns immediately if the table is closed.
 *
 * <p>No check is made for an already-present record with the same key. If appending the
 * record fails with an {@link EOFException}, {@code compactOrThrow()} is called and the
 * insert is retried.
 *
 * @param record The record to insert.
 * @throws IOException (EOFException specifically, if memory ran out)
 */
@Override
public void insert(T record) throws IOException {
  if (closed) {
    return;
  }

  final int hash = MathUtils.jenkinsHash(buildSideComparator.hash(record));
  final int bucketIndex = hash & numBucketsMask;
  // segment that contains the bucket
  final MemorySegment segment = bucketSegments[bucketIndex >>> numBucketsPerSegmentBits];
  // offset of the bucket within that segment
  final int offsetInSegment = (bucketIndex & numBucketsPerSegmentMask) << bucketSizeBits;
  final long previousFirst = segment.getLong(offsetInSegment);

  try {
    // the pointer returned by the append becomes the bucket's new first pointer
    segment.putLong(offsetInSegment, recordArea.appendPointerAndRecord(previousFirst, record));
  } catch (EOFException ex) {
    // ran out of memory: compact (or fail), then start the insert over
    compactOrThrow();
    insert(record);
    return;
  }

  numElements++;
  resizeTableIfNecessary();
}

/**
 * Adds the given record to the hash table. Returns immediately if the table is closed.
 *
 * <p>No check is made for an already-present record with the same key. If appending the
 * record fails with an {@link EOFException}, {@code compactOrThrow()} is called and the
 * insert is retried.
 *
 * @param record The record to insert.
 * @throws IOException (EOFException specifically, if memory ran out)
 */
@Override
public void insert(T record) throws IOException {
  if (closed) {
    return;
  }

  final int hash = MathUtils.jenkinsHash(buildSideComparator.hash(record));
  final int bucketIndex = hash & numBucketsMask;
  // segment that contains the bucket
  final MemorySegment segment = bucketSegments[bucketIndex >>> numBucketsPerSegmentBits];
  // offset of the bucket within that segment
  final int offsetInSegment = (bucketIndex & numBucketsPerSegmentMask) << bucketSizeBits;
  final long previousFirst = segment.getLong(offsetInSegment);

  try {
    // the pointer returned by the append becomes the bucket's new first pointer
    segment.putLong(offsetInSegment, recordArea.appendPointerAndRecord(previousFirst, record));
  } catch (EOFException ex) {
    // ran out of memory: compact (or fail), then start the insert over
    compactOrThrow();
    insert(record);
    return;
  }

  numElements++;
  resizeTableIfNecessary();
}

/**
 * Adds the given record to the hash table. Returns immediately if the table is closed.
 *
 * <p>No check is made for an already-present record with the same key. If appending the
 * record fails with an {@link EOFException}, {@code compactOrThrow()} is called and the
 * insert is retried.
 *
 * @param record The record to insert.
 * @throws IOException (EOFException specifically, if memory ran out)
 */
@Override
public void insert(T record) throws IOException {
  if (closed) {
    return;
  }

  final int hash = MathUtils.jenkinsHash(buildSideComparator.hash(record));
  final int bucketIndex = hash & numBucketsMask;
  // segment that contains the bucket
  final MemorySegment segment = bucketSegments[bucketIndex >>> numBucketsPerSegmentBits];
  // offset of the bucket within that segment
  final int offsetInSegment = (bucketIndex & numBucketsPerSegmentMask) << bucketSizeBits;
  final long previousFirst = segment.getLong(offsetInSegment);

  try {
    // the pointer returned by the append becomes the bucket's new first pointer
    segment.putLong(offsetInSegment, recordArea.appendPointerAndRecord(previousFirst, record));
  } catch (EOFException ex) {
    // ran out of memory: compact (or fail), then start the insert over
    compactOrThrow();
    insert(record);
    return;
  }

  numElements++;
  resizeTableIfNecessary();
}

/**
 * Adds the given record to the hash table. Returns immediately if the table is closed.
 *
 * <p>No check is made for an already-present record with the same key. If appending the
 * record fails with an {@link EOFException}, {@code compactOrThrow()} is called and the
 * insert is retried.
 *
 * @param record The record to insert.
 * @throws IOException (EOFException specifically, if memory ran out)
 */
@Override
public void insert(T record) throws IOException {
  if (closed) {
    return;
  }

  final int hash = MathUtils.jenkinsHash(buildSideComparator.hash(record));
  final int bucketIndex = hash & numBucketsMask;
  // segment that contains the bucket
  final MemorySegment segment = bucketSegments[bucketIndex >>> numBucketsPerSegmentBits];
  // offset of the bucket within that segment
  final int offsetInSegment = (bucketIndex & numBucketsPerSegmentMask) << bucketSizeBits;
  final long previousFirst = segment.getLong(offsetInSegment);

  try {
    // the pointer returned by the append becomes the bucket's new first pointer
    segment.putLong(offsetInSegment, recordArea.appendPointerAndRecord(previousFirst, record));
  } catch (EOFException ex) {
    // ran out of memory: compact (or fail), then start the insert over
    compactOrThrow();
    insert(record);
    return;
  }

  numElements++;
  resizeTableIfNecessary();
}

/**
 * Rebuilds the table using the specified number of bucket segments.
 *
 * <p>The current bucket segments are released and {@code newNumBucketSegments} new ones are
 * allocated. Every record returned by the entry iterator is then re-hashed, re-appended to the
 * record area, and the pointer returned by the append is stored in the record's bucket.
 * Afterwards the segments after the append position are freed and {@code holes} is reset to 0.
 * The loop stops early if the table gets closed.
 *
 * @param newNumBucketSegments number of bucket segments of the new table (narrowed to
 *     {@code int} before allocation)
 * @throws IOException declared by this method; presumably raised by the iterator or the
 *     record area (not visible here)
 * @throws RuntimeException if an {@link EOFException} occurs during the rebuild, which is
 *     considered a bug; the {@code EOFException} is attached as the cause
 */
private void rebuild(long newNumBucketSegments) throws IOException {
  // Get new bucket segments
  releaseBucketSegments();
  allocateBucketSegments((int)newNumBucketSegments);
  T record = buildSideSerializer.createInstance();
  try {
    // the iterator is obtained before the append/write positions are reset
    EntryIterator iter = getEntryIterator();
    recordArea.resetAppendPosition();
    recordArea.setWritePosition(0);
    while ((record = iter.next(record)) != null && !closed) {
      final int hashCode = MathUtils.jenkinsHash(buildSideComparator.hash(record));
      final int bucket = hashCode & numBucketsMask;
      final int bucketSegmentIndex = bucket >>> numBucketsPerSegmentBits; // which segment contains the bucket
      final MemorySegment bucketSegment = bucketSegments[bucketSegmentIndex];
      final int bucketOffset = (bucket & numBucketsPerSegmentMask) << bucketSizeBits; // offset of the bucket in the segment
      final long firstPointer = bucketSegment.getLong(bucketOffset);
      // the pointer returned by the append becomes the bucket's new first pointer
      long ptrToAppended = recordArea.noSeekAppendPointerAndRecord(firstPointer, record);
      bucketSegment.putLong(bucketOffset, ptrToAppended);
    }
    recordArea.freeSegmentsAfterAppendPosition();
    holes = 0;
  } catch (EOFException ex) {
    // keep the original exception as the cause so its stack trace is not lost
    throw new RuntimeException("Bug in InPlaceMutableHashTable: we shouldn't get out of memory during a rebuild, " +
      "because we aren't allocating any new memory.", ex);
  }
}

/**
 * Rebuilds the table using the specified number of bucket segments.
 *
 * <p>The current bucket segments are released and {@code newNumBucketSegments} new ones are
 * allocated. Every record returned by the entry iterator is then re-hashed, re-appended to the
 * record area, and the pointer returned by the append is stored in the record's bucket.
 * Afterwards the segments after the append position are freed and {@code holes} is reset to 0.
 * The loop stops early if the table gets closed.
 *
 * @param newNumBucketSegments number of bucket segments of the new table (narrowed to
 *     {@code int} before allocation)
 * @throws IOException declared by this method; presumably raised by the iterator or the
 *     record area (not visible here)
 * @throws RuntimeException if an {@link EOFException} occurs during the rebuild, which is
 *     considered a bug; the {@code EOFException} is attached as the cause
 */
private void rebuild(long newNumBucketSegments) throws IOException {
  // Get new bucket segments
  releaseBucketSegments();
  allocateBucketSegments((int)newNumBucketSegments);
  T record = buildSideSerializer.createInstance();
  try {
    // the iterator is obtained before the append/write positions are reset
    EntryIterator iter = getEntryIterator();
    recordArea.resetAppendPosition();
    recordArea.setWritePosition(0);
    while ((record = iter.next(record)) != null && !closed) {
      final int hashCode = MathUtils.jenkinsHash(buildSideComparator.hash(record));
      final int bucket = hashCode & numBucketsMask;
      final int bucketSegmentIndex = bucket >>> numBucketsPerSegmentBits; // which segment contains the bucket
      final MemorySegment bucketSegment = bucketSegments[bucketSegmentIndex];
      final int bucketOffset = (bucket & numBucketsPerSegmentMask) << bucketSizeBits; // offset of the bucket in the segment
      final long firstPointer = bucketSegment.getLong(bucketOffset);
      // the pointer returned by the append becomes the bucket's new first pointer
      long ptrToAppended = recordArea.noSeekAppendPointerAndRecord(firstPointer, record);
      bucketSegment.putLong(bucketOffset, ptrToAppended);
    }
    recordArea.freeSegmentsAfterAppendPosition();
    holes = 0;
  } catch (EOFException ex) {
    // keep the original exception as the cause so its stack trace is not lost
    throw new RuntimeException("Bug in InPlaceMutableHashTable: we shouldn't get out of memory during a rebuild, " +
      "because we aren't allocating any new memory.", ex);
  }
}

/**
 * Rebuilds the table using the specified number of bucket segments.
 *
 * <p>The current bucket segments are released and {@code newNumBucketSegments} new ones are
 * allocated. Every record returned by the entry iterator is then re-hashed, re-appended to the
 * record area, and the pointer returned by the append is stored in the record's bucket.
 * Afterwards the segments after the append position are freed and {@code holes} is reset to 0.
 * The loop stops early if the table gets closed.
 *
 * @param newNumBucketSegments number of bucket segments of the new table (narrowed to
 *     {@code int} before allocation)
 * @throws IOException declared by this method; presumably raised by the iterator or the
 *     record area (not visible here)
 * @throws RuntimeException if an {@link EOFException} occurs during the rebuild, which is
 *     considered a bug; the {@code EOFException} is attached as the cause
 */
private void rebuild(long newNumBucketSegments) throws IOException {
  // Get new bucket segments
  releaseBucketSegments();
  allocateBucketSegments((int)newNumBucketSegments);
  T record = buildSideSerializer.createInstance();
  try {
    // the iterator is obtained before the append/write positions are reset
    EntryIterator iter = getEntryIterator();
    recordArea.resetAppendPosition();
    recordArea.setWritePosition(0);
    while ((record = iter.next(record)) != null && !closed) {
      final int hashCode = MathUtils.jenkinsHash(buildSideComparator.hash(record));
      final int bucket = hashCode & numBucketsMask;
      final int bucketSegmentIndex = bucket >>> numBucketsPerSegmentBits; // which segment contains the bucket
      final MemorySegment bucketSegment = bucketSegments[bucketSegmentIndex];
      final int bucketOffset = (bucket & numBucketsPerSegmentMask) << bucketSizeBits; // offset of the bucket in the segment
      final long firstPointer = bucketSegment.getLong(bucketOffset);
      // the pointer returned by the append becomes the bucket's new first pointer
      long ptrToAppended = recordArea.noSeekAppendPointerAndRecord(firstPointer, record);
      bucketSegment.putLong(bucketOffset, ptrToAppended);
    }
    recordArea.freeSegmentsAfterAppendPosition();
    holes = 0;
  } catch (EOFException ex) {
    // keep the original exception as the cause so its stack trace is not lost
    throw new RuntimeException("Bug in InPlaceMutableHashTable: we shouldn't get out of memory during a rebuild, " +
      "because we aren't allocating any new memory.", ex);
  }
}

/**
 * Rebuilds the table using the specified number of bucket segments.
 *
 * <p>The current bucket segments are released and {@code newNumBucketSegments} new ones are
 * allocated. Every record returned by the entry iterator is then re-hashed, re-appended to the
 * record area, and the pointer returned by the append is stored in the record's bucket.
 * Afterwards the segments after the append position are freed and {@code holes} is reset to 0.
 * The loop stops early if the table gets closed.
 *
 * @param newNumBucketSegments number of bucket segments of the new table (narrowed to
 *     {@code int} before allocation)
 * @throws IOException declared by this method; presumably raised by the iterator or the
 *     record area (not visible here)
 * @throws RuntimeException if an {@link EOFException} occurs during the rebuild, which is
 *     considered a bug; the {@code EOFException} is attached as the cause
 */
private void rebuild(long newNumBucketSegments) throws IOException {
  // Get new bucket segments
  releaseBucketSegments();
  allocateBucketSegments((int)newNumBucketSegments);
  T record = buildSideSerializer.createInstance();
  try {
    // the iterator is obtained before the append/write positions are reset
    EntryIterator iter = getEntryIterator();
    recordArea.resetAppendPosition();
    recordArea.setWritePosition(0);
    while ((record = iter.next(record)) != null && !closed) {
      final int hashCode = MathUtils.jenkinsHash(buildSideComparator.hash(record));
      final int bucket = hashCode & numBucketsMask;
      final int bucketSegmentIndex = bucket >>> numBucketsPerSegmentBits; // which segment contains the bucket
      final MemorySegment bucketSegment = bucketSegments[bucketSegmentIndex];
      final int bucketOffset = (bucket & numBucketsPerSegmentMask) << bucketSizeBits; // offset of the bucket in the segment
      final long firstPointer = bucketSegment.getLong(bucketOffset);
      // the pointer returned by the append becomes the bucket's new first pointer
      long ptrToAppended = recordArea.noSeekAppendPointerAndRecord(firstPointer, record);
      bucketSegment.putLong(bucketOffset, ptrToAppended);
    }
    recordArea.freeSegmentsAfterAppendPosition();
    holes = 0;
  } catch (EOFException ex) {
    // keep the original exception as the cause so its stack trace is not lost
    throw new RuntimeException("Bug in InPlaceMutableHashTable: we shouldn't get out of memory during a rebuild, " +
      "because we aren't allocating any new memory.", ex);
  }
}

// Scramble the comparator's hash of the record with jenkinsHash, then reduce it modulo the number of buckets.
final int searchHashCode = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
final int posHashCode = searchHashCode % this.numBuckets;

// Scramble the comparator's hash of the record with jenkinsHash, then reduce it modulo the number of buckets.
final int searchHashCode = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
final int posHashCode = searchHashCode % this.numBuckets;

// Scramble the comparator's hash of the record with jenkinsHash, then reduce it modulo the number of buckets.
final int searchHashCode = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
final int posHashCode = searchHashCode % this.numBuckets;

// Scramble the comparator's hash of the record with jenkinsHash, then reduce it modulo the number of buckets.
final int searchHashCode = MathUtils.jenkinsHash(this.buildSideComparator.hash(record));
final int posHashCode = searchHashCode % this.numBuckets;

Javadoc

This function hashes an integer value. It is adapted from Bob Jenkins' website http://www.burtleburtle.net/bob/hash/integer.html. The hash function has the full avalanche property, meaning that every bit of the value to be hashed affects every bit of the hash value.

It is crucial to use different hash functions to partition data across machines and the internal partitioning of data structures. This hash function is intended for partitioning internally in data structures.

Popular methods of MathUtils

checkedDownCast
Casts the given value to a 32 bit integer, if it can be safely done. If the cast would change the nu
log2strict
Computes the logarithm of the given value to the base of 2. This method throws an error, if the give
murmurHash
This function hashes an integer value. It is crucial to use different hash functions to partition dat
bitMix
Bit-mixing for pseudo-randomization of integers (e.g., to guard against bad hash functions). Impleme
isPowerOf2
Checks whether the given value is a power of two.
roundDownToPowerOf2
Decrements the given number down to the closest power of two. If the argument is a power of two, it
roundUpToPowerOfTwo
Round the given number to the next power of two.
longToIntWithBitMixing
Pseudo-randomly maps a long (64-bit) to an integer (32-bit) using some bit-mixing for better distrib
flipSignBit
Flips the sign bit (most-significant-bit) of the input.
log2floor
Computes the logarithm of the given value to the base of 2, rounded down. It corresponds to the posi

Popular in Java

Start an intent from android
scheduleAtFixedRate (ScheduledExecutorService)
setRequestProperty (URLConnection)
requestLocationUpdates (LocationManager)
Stack (java.util)
Stack is a Last-In/First-Out(LIFO) data structure which represents a stack of objects. It enables u
StringUtils (org.apache.commons.lang)
Operations on java.lang.String that are null-safe. * IsEmpty/IsBlank - checks if a String contains
Rectangle (java.awt)
A Rectangle specifies an area in a coordinate space that is enclosed by the Rectangle object's top-
BoxLayout (javax.swing)
Loader (org.hibernate.loader)
Abstract superclass of object loading (and querying) strategies. This class implements useful common
Join (org.hibernate.mapping)
Top PhpStorm plugins

How to use the jenkinsHash method in org.apache.flink.util.MathUtils

Best Java code snippets using org.apache.flink.util.MathUtils.jenkinsHash (Showing top 20 results out of 315)

How to use
jenkinsHash
method
in
org.apache.flink.util.MathUtils