/* * Copyright (C) 2011 The Guava Authors * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.google.common.hash; import static com.google.common.hash.Hashing.ConcatenatedHashFunction; import static com.google.common.hash.Hashing.goodFastHash; import com.google.common.base.Charsets; import com.google.common.collect.ImmutableList; import com.google.common.collect.ImmutableTable; import com.google.common.collect.Lists; import com.google.common.collect.Table.Cell; import com.google.common.primitives.Ints; import com.google.common.testing.EqualsTester; import com.google.common.testing.NullPointerTester; import com.google.common.util.concurrent.AtomicLongMap; import junit.framework.TestCase; import java.lang.reflect.Method; import java.lang.reflect.Modifier; import java.nio.ByteBuffer; import java.util.Collections; import java.util.List; import java.util.Random; /** * Unit tests for {@link Hashing}. * * @author Dimitris Andreou * @author Kurt Alfred Kluever */ public class HashingTest extends TestCase { public void testMd5() { HashTestUtils.checkAvalanche(Hashing.md5(), 100, 0.4); HashTestUtils.checkNo2BitCharacteristics(Hashing.md5()); HashTestUtils.checkNoFunnels(Hashing.md5()); HashTestUtils.assertInvariants(Hashing.md5()); assertEquals("Hashing.md5()", Hashing.md5().toString()); } public void testSha1() { HashTestUtils.checkAvalanche(Hashing.sha1(), 100, 0.4); HashTestUtils.checkNo2BitCharacteristics(Hashing.sha1()); HashTestUtils.checkNoFunnels(Hashing.sha1()); HashTestUtils.assertInvariants(Hashing.sha1()); assertEquals("Hashing.sha1()", Hashing.sha1().toString()); } public void testSha256() { HashTestUtils.checkAvalanche(Hashing.sha256(), 100, 0.4); HashTestUtils.checkNo2BitCharacteristics(Hashing.sha256()); HashTestUtils.checkNoFunnels(Hashing.sha256()); HashTestUtils.assertInvariants(Hashing.sha256()); assertEquals("Hashing.sha256()", Hashing.sha256().toString()); } public void testSha512() { HashTestUtils.checkAvalanche(Hashing.sha512(), 100, 0.4); HashTestUtils.checkNo2BitCharacteristics(Hashing.sha512()); HashTestUtils.checkNoFunnels(Hashing.sha512()); HashTestUtils.assertInvariants(Hashing.sha512()); assertEquals("Hashing.sha512()", Hashing.sha512().toString()); } public void testCrc32() { HashTestUtils.assertInvariants(Hashing.crc32()); assertEquals("Hashing.crc32()", Hashing.crc32().toString()); } public void testAdler32() { HashTestUtils.assertInvariants(Hashing.adler32()); assertEquals("Hashing.adler32()", Hashing.adler32().toString()); } public void testMurmur3_128() { HashTestUtils.check2BitAvalanche(Hashing.murmur3_128(), 250, 0.20); HashTestUtils.checkAvalanche(Hashing.murmur3_128(), 250, 0.17); HashTestUtils.checkNo2BitCharacteristics(Hashing.murmur3_128()); HashTestUtils.checkNoFunnels(Hashing.murmur3_128()); HashTestUtils.assertInvariants(Hashing.murmur3_128()); assertEquals("Hashing.murmur3_128(0)", Hashing.murmur3_128().toString()); } public void testMurmur3_32() { HashTestUtils.check2BitAvalanche(Hashing.murmur3_32(), 250, 0.20); HashTestUtils.checkAvalanche(Hashing.murmur3_32(), 250, 0.17); HashTestUtils.checkNo2BitCharacteristics(Hashing.murmur3_32()); HashTestUtils.checkNoFunnels(Hashing.murmur3_32()); HashTestUtils.assertInvariants(Hashing.murmur3_32()); assertEquals("Hashing.murmur3_32(0)", Hashing.murmur3_32().toString()); } public void testSipHash24() { HashTestUtils.check2BitAvalanche(Hashing.sipHash24(), 250, 0.14); HashTestUtils.checkAvalanche(Hashing.sipHash24(), 250, 0.10); HashTestUtils.checkNo2BitCharacteristics(Hashing.sipHash24()); HashTestUtils.checkNoFunnels(Hashing.sipHash24()); HashTestUtils.assertInvariants(Hashing.sipHash24()); assertEquals("Hashing.sipHash24(506097522914230528, 1084818905618843912)", Hashing.sipHash24().toString()); } public void testGoodFastHash() { for (int i = 1; i < 200; i += 17) { HashFunction hasher = Hashing.goodFastHash(i); assertTrue(hasher.bits() >= i); HashTestUtils.assertInvariants(hasher); } } // goodFastHash(32) uses Murmur3_32. Use the same epsilon bounds. public void testGoodFastHash32() { HashTestUtils.check2BitAvalanche(Hashing.goodFastHash(32), 250, 0.20); HashTestUtils.checkAvalanche(Hashing.goodFastHash(32), 250, 0.17); HashTestUtils.checkNo2BitCharacteristics(Hashing.goodFastHash(32)); HashTestUtils.checkNoFunnels(Hashing.goodFastHash(32)); HashTestUtils.assertInvariants(Hashing.goodFastHash(32)); } // goodFastHash(128) uses Murmur3_128. Use the same epsilon bounds. public void testGoodFastHash128() { HashTestUtils.check2BitAvalanche(Hashing.goodFastHash(128), 250, 0.20); HashTestUtils.checkAvalanche(Hashing.goodFastHash(128), 250, 0.17); HashTestUtils.checkNo2BitCharacteristics(Hashing.goodFastHash(128)); HashTestUtils.checkNoFunnels(Hashing.goodFastHash(128)); HashTestUtils.assertInvariants(Hashing.goodFastHash(128)); } // goodFastHash(256) uses Murmur3_128. Use the same epsilon bounds. public void testGoodFastHash256() { HashTestUtils.check2BitAvalanche(Hashing.goodFastHash(256), 250, 0.20); HashTestUtils.checkAvalanche(Hashing.goodFastHash(256), 250, 0.17); HashTestUtils.checkNo2BitCharacteristics(Hashing.goodFastHash(256)); HashTestUtils.checkNoFunnels(Hashing.goodFastHash(256)); HashTestUtils.assertInvariants(Hashing.goodFastHash(256)); } public void testPadToLong() { assertEquals(0x1111111111111111L, Hashing.padToLong(HashCodes.fromLong(0x1111111111111111L))); assertEquals(0x9999999999999999L, Hashing.padToLong(HashCodes.fromLong(0x9999999999999999L))); assertEquals(0x0000000011111111L, Hashing.padToLong(HashCodes.fromInt(0x11111111))); assertEquals(0x0000000099999999L, Hashing.padToLong(HashCodes.fromInt(0x99999999))); } public void testConsistentHash_correctness() { long[] interestingValues = { -1, 0, 1, 2, Long.MAX_VALUE, Long.MIN_VALUE }; for (long h : interestingValues) { checkConsistentHashCorrectness(h); } Random r = new Random(7); for (int i = 0; i < 20; i++) { checkConsistentHashCorrectness(r.nextLong()); } } private void checkConsistentHashCorrectness(long hashCode) { int last = 0; for (int shards = 1; shards <= 100000; shards++) { int b = Hashing.consistentHash(hashCode, shards); if (b != last) { assertEquals(shards - 1, b); last = b; } } } public void testConsistentHash_probabilities() { AtomicLongMap<Integer> map = AtomicLongMap.create(); Random r = new Random(9); for (int i = 0; i < ITERS; i++) { countRemaps(r.nextLong(), map); } for (int shard = 2; shard <= MAX_SHARDS; shard++) { // Rough: don't exceed 1.2x the expected number of remaps by more than 20 assertTrue(map.get(shard) <= 1.2 * ITERS / shard + 20); } } private void countRemaps(long h, AtomicLongMap<Integer> map) { int last = 0; for (int shards = 2; shards <= MAX_SHARDS; shards++) { int chosen = Hashing.consistentHash(h, shards); if (chosen != last) { map.incrementAndGet(shards); last = chosen; } } } private static final int ITERS = 10000; private static final int MAX_SHARDS = 500; public void testConsistentHash_outOfRange() { try { Hashing.consistentHash(5L, 0); fail(); } catch (IllegalArgumentException expected) { } } public void testConsistentHash_ofHashCode() { checkSameResult(HashCode.fromLong(1), 1); checkSameResult(HashCode.fromLong(0x9999999999999999L), 0x9999999999999999L); checkSameResult(HashCode.fromInt(0x99999999), 0x0000000099999999L); } public void checkSameResult(HashCode hashCode, long equivLong) { assertEquals(Hashing.consistentHash(equivLong, 5555), Hashing.consistentHash(hashCode, 5555)); } /** * Check a few "golden" values to see that implementations across languages * are equivalent. */ public void testConsistentHash_linearCongruentialGeneratorCompatibility() { int[] golden100 = { 0, 55, 62, 8, 45, 59, 86, 97, 82, 59, 73, 37, 17, 56, 86, 21, 90, 37, 38, 83 }; for (int i = 0; i < golden100.length; i++) { assertEquals(golden100[i], Hashing.consistentHash(i, 100)); } assertEquals(6, Hashing.consistentHash(10863919174838991L, 11)); assertEquals(3, Hashing.consistentHash(2016238256797177309L, 11)); assertEquals(5, Hashing.consistentHash(1673758223894951030L, 11)); assertEquals(80343, Hashing.consistentHash(2, 100001)); assertEquals(22152, Hashing.consistentHash(2201, 100001)); assertEquals(15018, Hashing.consistentHash(2202, 100001)); } private static final double MAX_PERCENT_SPREAD = 0.5; private static final long RANDOM_SEED = 177L; public void testCombineOrdered_empty() { try { Hashing.combineOrdered(Collections.<HashCode>emptySet()); fail(); } catch (IllegalArgumentException expected) { } } public void testCombineOrdered_differentBitLengths() { try { Hashing.combineOrdered(ImmutableList.of(HashCode.fromInt(32), HashCode.fromLong(32L))); fail(); } catch (IllegalArgumentException expected) { } } public void testCombineOrdered() { HashCode hash31 = HashCode.fromInt(31); HashCode hash32 = HashCode.fromInt(32); assertEquals(hash32, Hashing.combineOrdered(ImmutableList.of(hash32))); assertEquals(HashCode.fromBytes(new byte[] { (byte) 0x80, 0, 0, 0 }), Hashing.combineOrdered(ImmutableList.of(hash32, hash32))); assertEquals(HashCode.fromBytes(new byte[] { (byte) 0xa0, 0, 0, 0 }), Hashing.combineOrdered(ImmutableList.of(hash32, hash32, hash32))); assertFalse( Hashing.combineOrdered(ImmutableList.of(hash31, hash32)).equals( Hashing.combineOrdered(ImmutableList.of(hash32, hash31)))); } public void testCombineOrdered_randomHashCodes() { Random random = new Random(7); List<HashCode> hashCodes = Lists.newArrayList(); for (int i = 0; i < 10; i++) { hashCodes.add(HashCode.fromLong(random.nextLong())); } HashCode hashCode1 = Hashing.combineOrdered(hashCodes); Collections.shuffle(hashCodes, random); HashCode hashCode2 = Hashing.combineOrdered(hashCodes); assertFalse(hashCode1.equals(hashCode2)); } public void testCombineUnordered_empty() { try { Hashing.combineUnordered(Collections.<HashCode>emptySet()); fail(); } catch (IllegalArgumentException expected) { } } public void testCombineUnordered_differentBitLengths() { try { Hashing.combineUnordered(ImmutableList.of(HashCode.fromInt(32), HashCode.fromLong(32L))); fail(); } catch (IllegalArgumentException expected) { } } public void testCombineUnordered() { HashCode hash31 = HashCode.fromInt(31); HashCode hash32 = HashCode.fromInt(32); assertEquals(hash32, Hashing.combineUnordered(ImmutableList.of(hash32))); assertEquals(HashCode.fromInt(64), Hashing.combineUnordered(ImmutableList.of(hash32, hash32))); assertEquals(HashCode.fromInt(96), Hashing.combineUnordered(ImmutableList.of(hash32, hash32, hash32))); assertEquals( Hashing.combineUnordered(ImmutableList.of(hash31, hash32)), Hashing.combineUnordered(ImmutableList.of(hash32, hash31))); } public void testCombineUnordered_randomHashCodes() { Random random = new Random(RANDOM_SEED); List<HashCode> hashCodes = Lists.newArrayList(); for (int i = 0; i < 10; i++) { hashCodes.add(HashCode.fromLong(random.nextLong())); } HashCode hashCode1 = Hashing.combineUnordered(hashCodes); Collections.shuffle(hashCodes); HashCode hashCode2 = Hashing.combineUnordered(hashCodes); assertEquals(hashCode1, hashCode2); } public void testConcatenatedHashFunction_equals() { assertEquals( new ConcatenatedHashFunction(Hashing.md5()), new ConcatenatedHashFunction(Hashing.md5())); assertEquals( new ConcatenatedHashFunction(Hashing.md5(), Hashing.murmur3_32()), new ConcatenatedHashFunction(Hashing.md5(), Hashing.murmur3_32())); } public void testConcatenatedHashFunction_bits() { assertEquals(Hashing.md5().bits(), new ConcatenatedHashFunction(Hashing.md5()).bits()); assertEquals(Hashing.md5().bits() + Hashing.murmur3_32().bits(), new ConcatenatedHashFunction(Hashing.md5(), Hashing.murmur3_32()).bits()); assertEquals(Hashing.md5().bits() + Hashing.murmur3_32().bits() + Hashing.murmur3_128().bits(), new ConcatenatedHashFunction( Hashing.md5(), Hashing.murmur3_32(), Hashing.murmur3_128()).bits()); } public void testConcatenatedHashFunction_makeHash() { byte[] md5Hash = Hashing.md5().hashLong(42L).asBytes(); byte[] murmur3Hash = Hashing.murmur3_32().hashLong(42L).asBytes(); byte[] combined = new byte[md5Hash.length + murmur3Hash.length]; ByteBuffer buffer = ByteBuffer.wrap(combined); buffer.put(md5Hash); buffer.put(murmur3Hash); assertEquals(HashCode.fromBytes(combined), new ConcatenatedHashFunction(Hashing.md5(), Hashing.murmur3_32()).hashLong(42L)); } public void testHashIntReverseBytesVsHashBytesIntsToByteArray() { int input = 42; assertEquals( Hashing.md5().hashBytes(Ints.toByteArray(input)), Hashing.md5().hashInt(Integer.reverseBytes(input))); } public void testHashIntVsForLoop() { int input = 42; HashCode expected = Hashing.md5().hashInt(input); Hasher hasher = Hashing.md5().newHasher(); for (int i = 0; i < 32; i += 8) { hasher.putByte((byte) (input >> i)); } HashCode actual = hasher.hash(); assertEquals(expected, actual); } private static final String EMPTY_STRING = ""; private static final String TQBFJOTLD = "The quick brown fox jumps over the lazy dog"; private static final String TQBFJOTLDP = "The quick brown fox jumps over the lazy dog."; private static final ImmutableTable<HashFunction, String, String> KNOWN_HASHES = ImmutableTable.<HashFunction, String, String>builder() .put(Hashing.adler32(), EMPTY_STRING, "01000000") .put(Hashing.adler32(), TQBFJOTLD, "da0fdc5b") .put(Hashing.adler32(), TQBFJOTLDP, "0810e46b") .put(Hashing.md5(), EMPTY_STRING, "d41d8cd98f00b204e9800998ecf8427e") .put(Hashing.md5(), TQBFJOTLD, "9e107d9d372bb6826bd81d3542a419d6") .put(Hashing.md5(), TQBFJOTLDP, "e4d909c290d0fb1ca068ffaddf22cbd0") .put(Hashing.murmur3_128(), EMPTY_STRING, "00000000000000000000000000000000") .put(Hashing.murmur3_128(), TQBFJOTLD, "6c1b07bc7bbc4be347939ac4a93c437a") .put(Hashing.murmur3_128(), TQBFJOTLDP, "c902e99e1f4899cde7b68789a3a15d69") .put(Hashing.murmur3_32(), EMPTY_STRING, "00000000") .put(Hashing.murmur3_32(), TQBFJOTLD, "23f74f2e") .put(Hashing.murmur3_32(), TQBFJOTLDP, "fc8bc4d5") .put(Hashing.sha1(), EMPTY_STRING, "da39a3ee5e6b4b0d3255bfef95601890afd80709") .put(Hashing.sha1(), TQBFJOTLD, "2fd4e1c67a2d28fced849ee1bb76e7391b93eb12") .put(Hashing.sha1(), TQBFJOTLDP, "408d94384216f890ff7a0c3528e8bed1e0b01621") .put(Hashing.sha256(), EMPTY_STRING, "e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855") .put(Hashing.sha256(), TQBFJOTLD, "d7a8fbb307d7809469ca9abcb0082e4f8d5651e46d3cdb762d02d0bf37c9e592") .put(Hashing.sha256(), TQBFJOTLDP, "ef537f25c895bfa782526529a9b63d97aa631564d5d789c2b765448c8635fb6c") .put(Hashing.sha512(), EMPTY_STRING, "cf83e1357eefb8bdf1542850d66d8007d620e4050b5715dc83f4a921d36ce9ce" + "47d0d13c5d85f2b0ff8318d2877eec2f63b931bd47417a81a538327af927da3e") .put(Hashing.sha512(), TQBFJOTLD, "07e547d9586f6a73f73fbac0435ed76951218fb7d0c8d788a309d785436bbb64" + "2e93a252a954f23912547d1e8a3b5ed6e1bfd7097821233fa0538f3db854fee6") .put(Hashing.sha512(), TQBFJOTLDP, "91ea1245f20d46ae9a037a989f54f1f790f0a47607eeb8a14d12890cea77a1bb" + "c6c7ed9cf205e67b7f2b8fd4c7dfd3a7a8617e45f3c463d481c7e586c39ac1ed") .put(Hashing.crc32(), EMPTY_STRING, "00000000") .put(Hashing.crc32(), TQBFJOTLD, "39a34f41") .put(Hashing.crc32(), TQBFJOTLDP, "e9259051") .put(Hashing.sipHash24(), EMPTY_STRING, "310e0edd47db6f72") .put(Hashing.sipHash24(), TQBFJOTLD, "e46f1fdc05612752") .put(Hashing.sipHash24(), TQBFJOTLDP, "9b602581fce4d4f8") .build(); public void testAllHashFunctionsHaveKnownHashes() throws Exception { for (Method method : Hashing.class.getDeclaredMethods()) { if (method.getReturnType().equals(HashFunction.class) // must return HashFunction && Modifier.isPublic(method.getModifiers()) // only the public methods && method.getParameterTypes().length == 0) { // only the seed-less grapes^W hash functions HashFunction hashFunction = (HashFunction) method.invoke(Hashing.class); assertTrue("There should be at least 3 entries in KNOWN_HASHES for " + hashFunction, KNOWN_HASHES.row(hashFunction).size() >= 3); } } } public void testKnownUtf8Hashing() { for (Cell<HashFunction, String, String> cell : KNOWN_HASHES.cellSet()) { HashFunction func = cell.getRowKey(); String input = cell.getColumnKey(); String expected = cell.getValue(); assertEquals( String.format("Known hash for hash(%s, UTF_8) failed", input), expected, func.hashString(input, Charsets.UTF_8).toString()); } } public void testNullPointers() { NullPointerTester tester = new NullPointerTester() .setDefault(HashCode.class, HashCode.fromLong(0)); tester.testAllPublicStaticMethods(Hashing.class); } public void testSeedlessHashFunctionEquals() throws Exception { assertSeedlessHashFunctionEquals(Hashing.class); } public void testSeededHashFunctionEquals() throws Exception { assertSeededHashFunctionEquals(Hashing.class); } /** * Tests equality of {@link Hashing#goodFastHash} instances. This test must be separate from * {@link #testSeededHashFunctionEquals} because the parameter to {@code goodFastHash} is a size, * not a seed, and because that size is rounded up. Thus, {@code goodFastHash} instances with * different parameters can be equal. That fact is a problem for {@code * testSeededHashFunctionEquals}. */ public void testGoodFastHashEquals() throws Exception { HashFunction hashFunction1a = goodFastHash(1); HashFunction hashFunction1b = goodFastHash(32); HashFunction hashFunction2a = goodFastHash(33); HashFunction hashFunction2b = goodFastHash(128); HashFunction hashFunction3a = goodFastHash(129); HashFunction hashFunction3b = goodFastHash(256); HashFunction hashFunction4a = goodFastHash(257); HashFunction hashFunction4b = goodFastHash(384); new EqualsTester() .addEqualityGroup(hashFunction1a, hashFunction1b) .addEqualityGroup(hashFunction2a, hashFunction2b) .addEqualityGroup(hashFunction3a, hashFunction3b) .addEqualityGroup(hashFunction4a, hashFunction4b) .testEquals(); assertEquals(hashFunction1a.toString(), hashFunction1b.toString()); assertEquals(hashFunction2a.toString(), hashFunction2b.toString()); assertEquals(hashFunction3a.toString(), hashFunction3b.toString()); assertEquals(hashFunction4a.toString(), hashFunction4b.toString()); } static void assertSeedlessHashFunctionEquals(Class<?> clazz) throws Exception { for (Method method : clazz.getDeclaredMethods()) { if (method.getReturnType().equals(HashFunction.class) // must return HashFunction && Modifier.isPublic(method.getModifiers()) // only the public methods && method.getParameterTypes().length == 0) { // only the seed-less hash functions HashFunction hashFunction1a = (HashFunction) method.invoke(clazz); HashFunction hashFunction1b = (HashFunction) method.invoke(clazz); new EqualsTester() .addEqualityGroup(hashFunction1a, hashFunction1b) .testEquals(); // Make sure we're returning not only equal instances, but constants. assertSame(hashFunction1a, hashFunction1b); assertEquals(hashFunction1a.toString(), hashFunction1b.toString()); } } } static void assertSeededHashFunctionEquals(Class<?> clazz) throws Exception { Random random = new Random(RANDOM_SEED); for (Method method : clazz.getDeclaredMethods()) { if (method.getReturnType().equals(HashFunction.class) // must return HashFunction && Modifier.isPublic(method.getModifiers()) // only the public methods && method.getParameterTypes().length != 0 // only the seeded hash functions && !method.getName().equals("goodFastHash")) { // tested in testGoodFastHashEquals Object[] params1 = new Object[method.getParameterTypes().length]; Object[] params2 = new Object[method.getParameterTypes().length]; for (int i = 0; i < params1.length; i++) { if (method.getParameterTypes()[i] == int.class) { params1[i] = random.nextInt(); params2[i] = random.nextInt(); } else if (method.getParameterTypes()[i] == long.class) { params1[i] = random.nextLong(); params2[i] = random.nextLong(); } else { fail("Unable to create a random parameter for " + method.getParameterTypes()[i]); } } HashFunction hashFunction1a = (HashFunction) method.invoke(clazz, params1); HashFunction hashFunction1b = (HashFunction) method.invoke(clazz, params1); HashFunction hashFunction2 = (HashFunction) method.invoke(clazz, params2); new EqualsTester() .addEqualityGroup(hashFunction1a, hashFunction1b) .addEqualityGroup(hashFunction2) .testEquals(); assertEquals(hashFunction1a.toString(), hashFunction1b.toString()); } } } }