org.apache.spark.util.sketch.Murmur3_x86_32 java code examples

/**
 * Hashes a 64-bit value by folding its low 32 bits and then its high 32 bits into the seed.
 *
 * @param input the long value to hash
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with a length of 8
 */
public static int hashLong(long input, int seed) {
 final int lowerHalf = (int) input;
 final int upperHalf = (int) (input >>> 32);

 // The low word is mixed in before the high word.
 int state = mixH1(seed, mixK1(lowerHalf));
 state = mixH1(state, mixK1(upperHalf));
 return fmix(state, 8);
}

/**
 * Hashes {@code lengthInBytes} bytes located at {@code offset} relative to {@code base}.
 *
 * The largest prefix whose length is a multiple of 4 is consumed by {@code hashBytesByInt};
 * every remaining tail byte is then mixed into the state as a separate block.
 *
 * @param base the object the offset is relative to, as passed to {@code Platform}
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash; asserted to be non-negative
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeBytes(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes >= 0): "lengthInBytes cannot be negative";
 final int alignedLength = lengthInBytes - lengthInBytes % 4;
 int state = hashBytesByInt(base, offset, alignedLength, seed);
 int pos = alignedLength;
 while (pos < lengthInBytes) {
  // The value read is widened to int without any masking before it is mixed.
  final int tailByte = Platform.getByte(base, offset + pos);
  state = mixH1(state, mixK1(tailByte));
  pos++;
 }
 return fmix(state, lengthInBytes);
}

/**
 * Hashes {@code input} with this instance's seed.
 *
 * @param input the int value to hash
 * @return the result of the two-argument {@code hashInt} overload
 */
public int hashInt(int input) {
 final int instanceSeed = this.seed;
 return hashInt(input, instanceSeed);
}

/**
 * Hashes a region whose length is asserted to be a multiple of 8 bytes.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeWords(Object base, long offset, int lengthInBytes, int seed) {
 // Modeled on Guava's `Murmur32_Hasher.processRemaining(ByteBuffer)` method.
 assert (lengthInBytes % 8 == 0): "lengthInBytes must be a multiple of 8 (word-aligned)";
 return fmix(hashBytesByInt(base, offset, lengthInBytes, seed), lengthInBytes);
}

/**
 * Hashes {@code lengthInBytes} bytes located at {@code offset} relative to {@code base}.
 *
 * This variant is compatible with the original and other implementations;
 * use it for new components after Spark 2.3.
 *
 * The 4-byte-aligned prefix goes through {@code hashBytesByInt}. The remaining tail bytes are
 * masked to 8 bits and packed into a single block, first tail byte in the lowest 8 bits,
 * which is mixed once and XOR-ed into the state.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash; asserted to be non-negative
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeBytes2(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes >= 0): "lengthInBytes cannot be negative";
 final int alignedLength = lengthInBytes - lengthInBytes % 4;
 int state = hashBytesByInt(base, offset, alignedLength, seed);

 int tailBlock = 0;
 int bitOffset = 0;
 int pos = alignedLength;
 while (pos < lengthInBytes) {
  final int unsignedByte = Platform.getByte(base, offset + pos) & 0xFF;
  tailBlock ^= unsignedByte << bitOffset;
  pos++;
  bitOffset += 8;
 }

 state ^= mixK1(tailBlock);
 return fmix(state, lengthInBytes);
}

/**
 * Mixes a region into the hash state four bytes at a time, without finalization.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to consume; asserted to be a multiple of 4
 * @param seed the initial hash state
 * @return the intermediate state after every 4-byte block has been mixed in
 */
private static int hashBytesByInt(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes % 4 == 0);
 int state = seed;
 int pos = 0;
 while (pos < lengthInBytes) {
  final int block = Platform.getInt(base, offset + pos);
  state = mixH1(state, mixK1(block));
  pos += 4;
 }
 return state;
}

/**
 * Derives {@code hashCount} bucket indexes for a byte array from two Murmur3 hashes.
 *
 * The first hash uses seed 0 and the second uses the first hash as its seed. Bucket {@code i}
 * is {@code Math.abs((hash1 + i * hash2) % max)}.
 *
 * @param b the bytes to hash
 * @param hashCount the number of bucket indexes to produce
 * @param max the modulus applied to each combined hash
 * @return an array of {@code hashCount} bucket indexes
 */
private static int[] getHashBuckets(byte[] b, int hashCount, int max) {
 final int[] buckets = new int[hashCount];
 final int firstHash = Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, 0);
 final int secondHash =
  Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, firstHash);

 // A running sum equals firstHash + slot * secondHash under int wrap-around arithmetic.
 int combined = firstHash;
 for (int slot = 0; slot < hashCount; slot++) {
  buckets[slot] = Math.abs(combined % max);
  combined += secondHash;
 }
 return buckets;
}

/**
 * Hashes {@code input} with this instance's seed.
 *
 * @param input the long value to hash
 * @return the result of the two-argument {@code hashLong} overload
 */
public int hashLong(long input) {
 final int instanceSeed = this.seed;
 return hashLong(input, instanceSeed);
}

/**
 * Hashes a region with this instance's seed.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash
 * @return the result of the four-argument {@code hashUnsafeWords} overload
 */
public int hashUnsafeWords(Object base, long offset, int lengthInBytes) {
 final int instanceSeed = this.seed;
 return hashUnsafeWords(base, offset, lengthInBytes, instanceSeed);
}

/**
 * Hashes {@code lengthInBytes} bytes located at {@code offset} relative to {@code base}.
 *
 * This variant is compatible with the original and other implementations;
 * use it for new components after Spark 2.3.
 *
 * The 4-byte-aligned prefix goes through {@code hashBytesByInt}. The remaining tail bytes are
 * masked to 8 bits and packed into a single block, first tail byte in the lowest 8 bits,
 * which is mixed once and XOR-ed into the state.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash; asserted to be non-negative
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeBytes2(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes >= 0): "lengthInBytes cannot be negative";
 final int alignedLength = lengthInBytes - lengthInBytes % 4;
 int state = hashBytesByInt(base, offset, alignedLength, seed);

 int tailBlock = 0;
 int bitOffset = 0;
 int pos = alignedLength;
 while (pos < lengthInBytes) {
  final int unsignedByte = Platform.getByte(base, offset + pos) & 0xFF;
  tailBlock ^= unsignedByte << bitOffset;
  pos++;
  bitOffset += 8;
 }

 state ^= mixK1(tailBlock);
 return fmix(state, lengthInBytes);
}

/**
 * Hashes a region whose length is asserted to be a multiple of 8 bytes.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeWords(Object base, long offset, int lengthInBytes, int seed) {
 // Modeled on Guava's `Murmur32_Hasher.processRemaining(ByteBuffer)` method.
 assert (lengthInBytes % 8 == 0): "lengthInBytes must be a multiple of 8 (word-aligned)";
 return fmix(hashBytesByInt(base, offset, lengthInBytes, seed), lengthInBytes);
}

/**
 * Mixes a region into the hash state four bytes at a time, without finalization.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to consume; asserted to be a multiple of 4
 * @param seed the initial hash state
 * @return the intermediate state after every 4-byte block has been mixed in
 */
private static int hashBytesByInt(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes % 4 == 0);
 int state = seed;
 int pos = 0;
 while (pos < lengthInBytes) {
  final int block = Platform.getInt(base, offset + pos);
  state = mixH1(state, mixK1(block));
  pos += 4;
 }
 return state;
}

/**
 * Derives {@code hashCount} bucket indexes for a byte array from two Murmur3 hashes.
 *
 * The first hash uses seed 0 and the second uses the first hash as its seed. Bucket {@code i}
 * is {@code Math.abs((hash1 + i * hash2) % max)}.
 *
 * @param b the bytes to hash
 * @param hashCount the number of bucket indexes to produce
 * @param max the modulus applied to each combined hash
 * @return an array of {@code hashCount} bucket indexes
 */
private static int[] getHashBuckets(byte[] b, int hashCount, int max) {
 final int[] buckets = new int[hashCount];
 final int firstHash = Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, 0);
 final int secondHash =
  Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, firstHash);

 // A running sum equals firstHash + slot * secondHash under int wrap-around arithmetic.
 int combined = firstHash;
 for (int slot = 0; slot < hashCount; slot++) {
  buckets[slot] = Math.abs(combined % max);
  combined += secondHash;
 }
 return buckets;
}

/**
 * Hashes {@code input} with this instance's seed.
 *
 * @param input the long value to hash
 * @return the result of the two-argument {@code hashLong} overload
 */
public int hashLong(long input) {
 final int instanceSeed = this.seed;
 return hashLong(input, instanceSeed);
}

/**
 * Hashes a region with this instance's seed.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash
 * @return the result of the four-argument {@code hashUnsafeWords} overload
 */
public int hashUnsafeWords(Object base, long offset, int lengthInBytes) {
 final int instanceSeed = this.seed;
 return hashUnsafeWords(base, offset, lengthInBytes, instanceSeed);
}

/**
 * Hashes a single 32-bit value.
 *
 * @param input the int value to hash
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with a length of 4
 */
public static int hashInt(int input, int seed) {
 final int mixedState = mixH1(seed, mixK1(input));
 return fmix(mixedState, 4);
}

/**
 * Hashes {@code lengthInBytes} bytes located at {@code offset} relative to {@code base}.
 *
 * The largest prefix whose length is a multiple of 4 is consumed by {@code hashBytesByInt};
 * every remaining tail byte is then mixed into the state as a separate block.
 *
 * @param base the object the offset is relative to, as passed to {@code Platform}
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash; asserted to be non-negative
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeBytes(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes >= 0): "lengthInBytes cannot be negative";
 final int alignedLength = lengthInBytes - lengthInBytes % 4;
 int state = hashBytesByInt(base, offset, alignedLength, seed);
 int pos = alignedLength;
 while (pos < lengthInBytes) {
  // The value read is widened to int without any masking before it is mixed.
  final int tailByte = Platform.getByte(base, offset + pos);
  state = mixH1(state, mixK1(tailByte));
  pos++;
 }
 return fmix(state, lengthInBytes);
}

/**
 * Hashes a region whose length is asserted to be a multiple of 8 bytes.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to hash
 * @param seed the initial hash state
 * @return the finalized hash, produced by {@code fmix} with {@code lengthInBytes}
 */
public static int hashUnsafeWords(Object base, long offset, int lengthInBytes, int seed) {
 // Modeled on Guava's `Murmur32_Hasher.processRemaining(ByteBuffer)` method.
 assert (lengthInBytes % 8 == 0): "lengthInBytes must be a multiple of 8 (word-aligned)";
 return fmix(hashBytesByInt(base, offset, lengthInBytes, seed), lengthInBytes);
}

/**
 * Mixes a region into the hash state four bytes at a time, without finalization.
 *
 * @param base the object the offset is relative to
 * @param offset the starting offset of the data
 * @param lengthInBytes the number of bytes to consume; asserted to be a multiple of 4
 * @param seed the initial hash state
 * @return the intermediate state after every 4-byte block has been mixed in
 */
private static int hashBytesByInt(Object base, long offset, int lengthInBytes, int seed) {
 assert (lengthInBytes % 4 == 0);
 int state = seed;
 int pos = 0;
 while (pos < lengthInBytes) {
  final int block = Platform.getInt(base, offset + pos);
  state = mixH1(state, mixK1(block));
  pos += 4;
 }
 return state;
}

/**
 * Derives {@code hashCount} bucket indexes for a byte array from two Murmur3 hashes.
 *
 * The first hash uses seed 0 and the second uses the first hash as its seed. Bucket {@code i}
 * is {@code Math.abs((hash1 + i * hash2) % max)}.
 *
 * @param b the bytes to hash
 * @param hashCount the number of bucket indexes to produce
 * @param max the modulus applied to each combined hash
 * @return an array of {@code hashCount} bucket indexes
 */
private static int[] getHashBuckets(byte[] b, int hashCount, int max) {
 final int[] buckets = new int[hashCount];
 final int firstHash = Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, 0);
 final int secondHash =
  Murmur3_x86_32.hashUnsafeBytes(b, Platform.BYTE_ARRAY_OFFSET, b.length, firstHash);

 // A running sum equals firstHash + slot * secondHash under int wrap-around arithmetic.
 int combined = firstHash;
 for (int slot = 0; slot < hashCount; slot++) {
  buckets[slot] = Math.abs(combined % max);
  combined += secondHash;
 }
 return buckets;
}

Javadoc

32-bit Murmur3 hasher. This is based on Guava's Murmur3_32HashFunction.

Most used methods

Popular in Java

Parsing JSON documents to java classes using gson
compareTo (BigDecimal)
putExtra (Intent)
findViewById (Activity)
OutputStream (java.io)
A writable sink for bytes. Most clients will use output streams that write data to the file system (
Proxy (java.net)
This class represents proxy server settings. A created instance of Proxy stores a type and an addres
MessageFormat (java.text)
Produces concatenated messages in language-neutral way. New code should probably use java.util.Forma
Collections (java.util)
This class consists exclusively of static methods that operate on or return collections. It contains
BlockingQueue (java.util.concurrent)
A java.util.Queue that additionally supports operations that wait for the queue to become non-empty
Container (java.awt)
A generic Abstract Window Toolkit(AWT) container object is a component that can contain other AWT co
Top Vim plugins

How to use Murmur3_x86_32 in org.apache.spark.util.sketch

Best Java code snippets using org.apache.spark.util.sketch.Murmur3_x86_32 (Showing top 20 results out of 315)

How to use
Murmur3_x86_32
in
org.apache.spark.util.sketch