com.google.common.hash.HashFunction java code examples

Refine search

/**
 * Computes a short SHA-1 fingerprint of the given text.
 *
 * <p>The text is hashed with SHA-1 using the {@code charset} from the enclosing scope, the digest
 * is rendered as base16, and only its first eight characters are kept, lower-cased.
 *
 * @param source text to fingerprint
 * @return the first eight base16 characters of the digest, in lower case
 */
private String sha1(final CharSequence source) {
 final byte[] digest = Hashing.sha1().hashString(source, charset).asBytes();
 final String hex = BaseEncoding.base16().encode(digest);
 return hex.substring(0, 8).toLowerCase();
}

/**
 * Computes a SHA-1 fingerprint over the contents of every non-directory entry under {@code dir},
 * followed by the contents of {@code sprite} and {@code css} when those files exist.
 *
 * @param dir root of the file tree whose contents are hashed
 * @param sprite extra file appended to the hash if it exists
 * @param css extra file appended to the hash if it exists
 * @return the digest as a lower-case base16 string
 * @throws IOException if walking {@code dir} or reading {@code sprite}/{@code css} fails
 */
private String sha1(final File dir, final File sprite, final File css) throws IOException {
 try (Stream<Path> stream = Files.walk(dir.toPath())) {
  Hasher sha1 = Hashing.sha1().newHasher();
  // Files.walk does not promise a stable order for directory entries; sort the paths so the
  // same tree always feeds its bytes to the hasher in the same order.
  // NOTE(review): how Try.run treats a failed read is not visible here -- confirm that
  // unreadable files are not silently left out of the fingerprint.
  stream.filter(p -> !Files.isDirectory(p))
    .sorted()
    .forEach(p -> Try.run(() -> sha1.putBytes(Files.readAllBytes(p))));
  if (sprite.exists()) {
   sha1.putBytes(Files.readAllBytes(sprite.toPath()));
  }
  if (css.exists()) {
   sha1.putBytes(Files.readAllBytes(css.toPath()));
  }
  return BaseEncoding.base16().encode(sha1.hash().asBytes()).toLowerCase();
 }
}

/**
 * Adds the customer-supplied encryption key headers, if the options carry such a key.
 *
 * <p>When a key is present, three headers are set under {@code headerPrefix}: {@code algorithm}
 * (always {@code AES256}), {@code key} (the key as given) and {@code key-sha256} (the base64 of
 * the SHA-256 digest of the base64-decoded key). Without a key, nothing is set.
 *
 * @param headers headers to add to
 * @param headerPrefix prefix prepended to each header name
 * @param options options that may contain {@code Option.CUSTOMER_SUPPLIED_KEY}
 */
private static void setEncryptionHeaders(
  HttpHeaders headers, String headerPrefix, Map<Option, ?> options) {
 final String key = Option.CUSTOMER_SUPPLIED_KEY.getString(options);
 if (key == null) {
  return;
 }
 final BaseEncoding base64 = BaseEncoding.base64();
 headers.set(headerPrefix + "algorithm", "AES256");
 headers.set(headerPrefix + "key", key);
 // The digest is taken over the decoded key bytes, not over the base64 text.
 final byte[] keyDigest = Hashing.sha256().hashBytes(base64.decode(key)).asBytes();
 headers.set(headerPrefix + "key-sha256", base64.encode(keyDigest));
}

/**
 * Checks that hashing an int in one call gives the same MD5 hash code as feeding its four bytes
 * to a hasher one at a time, lowest-order byte first.
 */
public void testHashIntVsForLoop() {
 final int value = 42;
 final Hasher byteWise = Hashing.md5().newHasher();
 for (int shift = 0; shift < Integer.SIZE; shift += Byte.SIZE) {
  byteWise.putByte((byte) (value >> shift));
 }
 assertEquals(Hashing.md5().hashInt(value), byteWise.hash());
}

/** Checks that hashing a string as UTF-8 equals hashing that string's UTF-8 bytes. */
@SuppressWarnings("deprecation")
public void testSimpleStringUtf8() {
 final String text = "ABCDefGHI\u0799";
 assertEquals(
   murmur3_32().hashBytes(text.getBytes(Charsets.UTF_8)),
   murmur3_32().hashString(text, Charsets.UTF_8));
}

/**
 * Checks, for a handful of sample strings, that the {@code hashUnencodedChars} shortcut agrees
 * with pushing the same string through a fresh hasher.
 */
public void testStringsConsistency() {
 final String[] samples = {"", "some", "test", "strings", "to", "try"};
 for (String sample : samples) {
  assertEquals(
    HASH_FN.newHasher().putUnencodedChars(sample).hash(),
    HASH_FN.hashUnencodedChars(sample));
 }
}

 /**
  * Reads the wire-wrapped server stream to the end and verifies what was seen.
  *
  * <p>The MD5 of the bytes read must match {@code sysHttpStreamMd5}, and the byte length of the
  * wire log buffer must be 3331484.
  *
  * @return always {@code null}
  * @throws Exception if set-up, copying or the pause fails
  */
 public Void call() throws Exception {
   HttpWire wire = setUp();
   InputStream in = wire.input(fromServer);
   ByteArrayOutputStream out = new ByteArrayOutputStream();
   copy(in, out);
   byte[] compare = md5().hashBytes(out.toByteArray()).asBytes();
   // NOTE(review): presumably gives the wire logger time to finish writing -- confirm.
   Thread.sleep(100);
   // Name the missing value in the message; passing the value itself would report only "null".
   assertEquals(base16().lowerCase().encode(compare), checkNotNull(sysHttpStreamMd5, "sysHttpStreamMd5"));
   assertEquals(((BufferLogger) wire.getWireLog()).buff.toString().getBytes().length, 3331484);
   return null;
 }
}

/**
 * Checks that {@code Murmur3Hash128} matches Guava's murmur3_128 on a random input shorter than
 * 16 bytes. Runs 100 times, each with a fresh random length and content.
 */
@Test(invocationCount = 100)
public void testLessThan16Bytes()
    throws Exception
{
  int length = ThreadLocalRandom.current().nextInt(16);
  byte[] input = randomBytes(length);
  byte[] guavaDigest = Hashing.murmur3_128().hashBytes(input).asBytes();
  byte[] sliceDigest = Murmur3Hash128.hash(Slices.wrappedBuffer(input)).getBytes();
  assertEquals(sliceDigest, guavaDigest);
}

/**
 * Checks that {@code Murmur3Hash32} matches Guava's murmur3_32 on a random input shorter than
 * 4 bytes. Runs 100 times, each with a fresh random length and content.
 */
@Test(invocationCount = 100)
public void testLessThan4Bytes()
    throws Exception
{
  int length = ThreadLocalRandom.current().nextInt(4);
  byte[] input = randomBytes(length);
  int guavaHash = Hashing.murmur3_32().hashBytes(input).asInt();
  assertEquals(Murmur3Hash32.hash(Slices.wrappedBuffer(input)), guavaHash);
}

// SHA-1 digest of the new commit metadata bytes, rendered as a base16 string.
final String newCommitMetadataSha1 =
  BaseEncoding.base16().encode(Hashing.sha1().hashBytes(newCommitMetadataBytes).asBytes());

  /**
   * Logs in as the given user through the global admin client, checks that a session was issued,
   * and logs that session out again.
   *
   * <p>The login uses an empty domain and the lower-case base16 MD5 of the literal
   * {@code "password"}.
   *
   * @param expectedUsername user name to log in with
   */
  private void checkLoginAsTheNewUser(String expectedUsername) {
   String passwordMd5 = base16().lowerCase().encode(md5().hashString("password", UTF_8).asBytes());
   LoginResponse response = globalAdminClient.getSessionClient()
      .loginUserInDomainWithHashOfPassword(expectedUsername, "", passwordMd5);

   assertNotNull(response);
   assertNotNull(response.getSessionKey());
   assertNotNull(response.getJSessionId());

   // Clean up the session that was just opened.
   client.getSessionClient().logoutUser(response.getSessionKey());
  }
}

/**
 * Guards the set of known time zone keys against accidental change.
 *
 * <p>All time zone keys are ordered by their numeric key, each key's number and id are fed into a
 * murmur3_128 hasher, and the resulting long is compared with a pinned constant.
 */
@Test
public void testZoneKeyData()
{
  Comparator<TimeZoneKey> byNumericKey = new Comparator<TimeZoneKey>()
  {
    @Override
    public int compare(TimeZoneKey left, TimeZoneKey right)
    {
      return Short.compare(left.getKey(), right.getKey());
    }
  };
  SortedSet<TimeZoneKey> zonesInKeyOrder = ImmutableSortedSet.copyOf(byNumericKey, TimeZoneKey.getTimeZoneKeys());

  Hasher fingerprint = Hashing.murmur3_128().newHasher();
  for (TimeZoneKey zone : zonesInKeyOrder) {
    fingerprint.putShort(zone.getKey())
        .putString(zone.getId(), StandardCharsets.UTF_8);
  }
  // Zone file should not (normally) be changed, so let's make this more difficult
  long observed = fingerprint.hash().asLong();
  assertEquals(observed, -4582158485614614451L, "zone-index.properties file contents changed!");
}

/**
 * Creates a blob from in-memory content, stamping the blob info with checksums of that content.
 *
 * <p>A {@code null} content is replaced by {@code EMPTY_BYTE_ARRAY}. The MD5 and CRC32C of the
 * content are base64-encoded and set on a copy of {@code blobInfo} before delegating to
 * {@code internalCreate}.
 *
 * @param blobInfo description of the blob to create
 * @param content blob bytes; may be {@code null}
 * @param options target options passed through to {@code internalCreate}
 * @return the result of {@code internalCreate}
 */
@Override
public Blob create(BlobInfo blobInfo, byte[] content, BlobTargetOption... options) {
 final byte[] payload = firstNonNull(content, EMPTY_BYTE_ARRAY);
 final BaseEncoding base64 = BaseEncoding.base64();
 final String md5 = base64.encode(Hashing.md5().hashBytes(payload).asBytes());
 final int crc = Hashing.crc32c().hashBytes(payload).asInt();
 final String crc32c = base64.encode(Ints.toByteArray(crc));
 final BlobInfo updatedInfo = blobInfo.toBuilder().setMd5(md5).setCrc32c(crc32c).build();
 return internalCreate(updatedInfo, payload, options);
}

/**
 * Stores {@code data} in the minio bucket under a key derived from its SHA-256, unless an object
 * with that key can already be fetched.
 *
 * <p>The raw hash is also recorded on {@code archive}. Upload failures are logged as warnings and
 * not rethrown.
 */
@Override
public void run()
{
  byte[] hash = Hashing.sha256().hashBytes(data).asBytes();
  String hex = BaseEncoding.base16().encode(hash);
  archive.setHash(hash);
  // Object key layout: "<first two hex chars>/<remaining hex chars>".
  String path = hex.substring(0, 2) + '/' + hex.substring(2);
  try
  {
    try (InputStream existing = minioClient.getObject(minioBucket, path))
    {
      // The object could be opened, so it is already stored.
      return;
    }
    catch (ErrorResponseException notFound)
    {
      // An error response from the lookup is taken to mean the object is not stored yet.
    }
    minioClient.putObject(minioBucket, path, new ByteArrayInputStream(data), data.length, "binary/octet-stream");
  }
  catch (ErrorResponseException | InsufficientDataException | InternalException | InvalidArgumentException | InvalidBucketNameException | NoResponseException | IOException | InvalidKeyException | NoSuchAlgorithmException | XmlPullParserException ex)
  {
    logger.warn("unable to upload data to store", ex);
  }
}

/**
 * Checks that a hash code survives a round trip through its string form: decoding
 * {@code toString()} as lower-case base16 and rebuilding a {@code HashCode} gives an equal value.
 */
public void testRoundTripHashCodeUsingBaseEncoding() {
 final HashCode original = Hashing.sha1().hashString("foo", Charsets.US_ASCII);
 final byte[] decoded = BaseEncoding.base16().lowerCase().decode(original.toString());
 assertEquals(original, HashCode.fromBytes(decoded));
}

// MD5 of "<fromType>$<toType>". The charset is explicit so the digest does not depend on the
// JVM's default encoding.
byte[] md5Suffix = Hashing.md5().hashBytes((fromType + "$" + toType).getBytes(java.nio.charset.StandardCharsets.UTF_8)).asBytes();
    makeClassName(Joiner.on("$").join("RowCast", BaseEncoding.base16().encode(md5Suffix))),
    type(Object.class));

/**
 * Checks the SHA-1 of a known sentence, then verifies that a hasher rejects further input with
 * {@code IllegalStateException} once {@code hash()} has been called.
 */
public void testPutAfterHash() {
 final Hasher hasher = Hashing.sha1().newHasher();
 final String digest =
   hasher.putString("The quick brown fox jumps over the lazy dog", Charsets.UTF_8)
     .hash()
     .toString();
 assertEquals("2fd4e1c67a2d28fced849ee1bb76e7391b93eb12", digest);
 try {
  hasher.putInt(42);
  fail();
 } catch (IllegalStateException expected) {
  // Putting data after hash() is the failure this test wants to see.
 }
}

/**
 * Asserts that the one-shot {@code hashBytes} shortcuts agree with feeding the same bytes through
 * a hasher, both for a whole random array and for a random sub-range of it.
 *
 * @param hashFunction function under test
 * @param random source of the array size, its contents, and the sub-range offset and length
 */
private static void assertHashBytesEquivalence(HashFunction hashFunction, Random random) {
 int size = random.nextInt(2048);
 byte[] bytes = new byte[size];
 random.nextBytes(bytes);
 assertEquals(
   hashFunction.hashBytes(bytes), hashFunction.newHasher(size).putBytes(bytes).hash());
 // size can be 0, and Random.nextInt(0) throws IllegalArgumentException. Drawing from inclusive
 // ranges (off in [0, size], len in [0, size - off]) keeps every bound positive and still
 // guarantees off + len <= size.
 int off = random.nextInt(size + 1);
 int len = random.nextInt(size - off + 1);
 assertEquals(
   hashFunction.hashBytes(bytes, off, len),
   hashFunction.newHasher(size).putBytes(bytes, off, len).hash());
}

/**
 * Checks the HMAC-MD5 of a known sentence under {@code MD5_KEY}, then verifies that calling
 * {@code hash()} a second time on the same hasher fails with {@code IllegalStateException}.
 */
public void testHashTwice() {
 final Hasher hmac = Hashing.hmacMd5(MD5_KEY).newHasher();
 final String digest =
   hmac.putString("The quick brown fox jumps over the lazy dog", UTF_8).hash().toString();
 assertEquals("9753980fe94daa8ecaa82216519393a9", digest);
 try {
  hmac.hash();
  fail();
 } catch (IllegalStateException expected) {
  // A second hash() call is the failure this test wants to see.
 }
}

 /**
  * Checks, on 10000 random longs, that {@code repeatableHasher} produces the same value as
  * Guava's murmur3_128 seeded with {@code MurmurHash.JCOMMON_SEED}.
  */
 @Test(groups = "fast")
 public void testPumaAndGuavaLongMurmurHash() throws Exception {
  // our impl is slightly faster, and this is just a check to see we match guava
  final HashFunction guava = Hashing.murmur3_128((int) MurmurHash.JCOMMON_SEED);

  for (int remaining = 10000; remaining > 0; remaining--) {
   final long sample = random.nextLong();
   Assert.assertEquals(repeatableHasher.hash(sample), guava.hashLong(sample).asLong());
  }
 }
}

Javadoc

A hash function is a collision-averse pure function that maps an arbitrary block of data to a number called a hash code.

Definition

Unpacking this definition:

block of data: the input for a hash function is always, in concept, an ordered byte array. This hashing API accepts an arbitrary sequence of byte and multibyte values (via Hasher), but this is merely a convenience; these are always translated into raw byte sequences under the covers.
hash code: each hash function always yields hash codes of the same fixed bit length (given by #bits). For example, Hashing#sha1 produces a 160-bit number, while Hashing#murmur3_32() yields only 32 bits. Because a long value is clearly insufficient to hold all hash code values, this API represents a hash code as an instance of HashCode.
pure function: the value produced must depend only on the input bytes, in the order they appear. Input data is never modified. HashFunction instances should always be stateless, and therefore thread-safe.
collision-averse: while it can't be helped that a hash function will sometimes produce the same hash code for distinct inputs (a "collision"), every hash function strives to some degree to make this unlikely. (Without this condition, a function that always returns zero could be called a hash function. It is not.)

Summarizing the last two points: "equal yield equal always; unequal yield unequal often." This is the most important characteristic of all hash functions.

Desirable properties

A high-quality hash function strives for some subset of the following virtues:

collision-resistant: while the definition above requires making at least some token attempt, one measure of the quality of a hash function is how well it succeeds at this goal. Important note: it may be easy to achieve the theoretical minimum collision rate when using completely random sample input. The true test of a hash function is how it performs on representative real-world data, which tends to contain many hidden patterns and clumps. The goal of a good hash function is to stamp these patterns out as thoroughly as possible.
bit-dispersing: masking out any single bit from a hash code should yield only the expected twofold increase to all collision rates. Informally, the "information" in the hash code should be as evenly "spread out" through the hash code's bits as possible. The result is that, for example, when choosing a bucket in a hash table of size 2^8, any eight bits could be consistently used.
cryptographic: certain hash functions such as Hashing#sha512 are designed to make it as infeasible as possible to reverse-engineer the input that produced a given hash code, or even to discover any two distinct inputs that yield the same result. These are called cryptographic hash functions. But, whenever it is learned that either of these feats has become computationally feasible, the function is deemed "broken" and should no longer be used for secure purposes. (This is the likely eventual fate of all cryptographic hashes.)
fast: perhaps self-explanatory, but often the most important consideration. We have published microbenchmark results for many common hash functions.

Providing input to a hash function

The primary way to provide the data that your hash function should act on is via a Hasher. Obtain a new hasher from the hash function using #newHasher, "push" the relevant data into it using methods like Hasher#putBytes(byte[]), and finally ask for the HashCode when finished using Hasher#hash. (See #newHasher for an example of this.)

If all you want to hash is a single byte array, string or long value, there are convenient shortcut methods defined directly on HashFunction to make this easier.

Hasher accepts primitive data types, but can also accept any Object of type T provided that you implement a Funnel to specify how to "feed" data from that object into the function. (See Hasher#putObject for an example of this.)

Compatibility note: Throughout this API, multibyte values are always interpreted in little-endian order. That is, hashing the byte array {0x01, 0x02, 0x03, 0x04} is equivalent to hashing the int value 0x04030201. If this isn't what you need, methods such as Integer#reverseBytes and Ints#toByteArray will help.

Relationship to Object#hashCode

Java's baked-in concept of hash codes is constrained to 32 bits, and provides no separation between hash algorithms and the data they act on, so alternate hash algorithms can't be easily substituted. Also, implementations of hashCode tend to be poor-quality, in part because they end up depending on other existing poor-quality hashCode implementations, including those in many JDK classes.

Object.hashCode implementations tend to be very fast, but have weak collision prevention and no expectation of bit dispersion. This leaves them perfectly suitable for use in hash tables, because extra collisions cause only a slight performance hit, while poor bit dispersion is easily corrected using a secondary hash function (which all reasonable hash table implementations in Java use). For the many uses of hash functions beyond data structures, however, Object.hashCode almost always falls short -- hence this library.

Most used methods

hashString
Shortcut for newHasher().putString(input, charset).hash(). Characters are encoded using the given Ch
newHasher
Begins a new hash code computation as #newHasher(), but provides a hint of the expected size of the
hashBytes
Shortcut for newHasher().putBytes(input, off, len).hash(). The implementation might perform better t
hashLong
Shortcut for newHasher().putLong(input).hash(); returns the hash code for the given long value, inte
hashUnencodedChars
Shortcut for newHasher().putUnencodedChars(input).hash(). The implementation might perform better th
bits
Returns the number of bits (a multiple of 32) that each hash code produced by this hash function has
hashObject
Shortcut for newHasher().putObject(instance, funnel).hash(). The implementation might perform better
hashInt
Shortcut for newHasher().putInt(input).hash(); returns the hash code for the given int value, interp

Popular in Java

Reading from database using SQL prepared statement
getSystemService (Context)
scheduleAtFixedRate (ScheduledExecutorService)
onCreateOptionsMenu (Activity)
Format (java.text)
The base class for all formats. This is an abstract base class which specifies the protocol for clas
TimerTask (java.util)
The TimerTask class represents a task to run at a specified time. The task may be run once or repeat
XPath (javax.xml.xpath)
XPath provides access to the XPath evaluation environment and expressions. Evaluation of XPath Expr
VirtualMachine (com.sun.tools.attach)
A Java virtual machine. A VirtualMachine represents a Java virtual machine to which this Java vir
Menu (java.awt)
JCheckBox (javax.swing)
Top plugins for Android Studio

How to use HashFunction in com.google.common.hash

Best Java code snippets using com.google.common.hash.HashFunction (Showing top 20 results out of 4,599)

Refine search

How to use
HashFunction
in
com.google.common.hash