2 * Copyright (c) 2009, 2012, 2014 Nicira, Inc.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
29 set_bit(uint32_t array[3], int bit)
31 assert(bit >= 0 && bit <= 96);
32 memset(array, 0, sizeof(uint32_t) * 3);
34 array[bit / 32] = UINT32_C(1) << (bit % 32);
39 hash_words_cb(uint32_t input)
41 return hash_words(&input, 1, 0);
45 jhash_words_cb(uint32_t input)
47 return jhash_words(&input, 1, 0);
51 hash_int_cb(uint32_t input)
53 return hash_int(input, 0);
57 check_word_hash(uint32_t (*hash)(uint32_t), const char *name,
62 for (i = 0; i <= 32; i++) {
63 uint32_t in1 = i < 32 ? UINT32_C(1) << i : 0;
64 for (j = i + 1; j <= 32; j++) {
65 uint32_t in2 = j < 32 ? UINT32_C(1) << j : 0;
66 uint32_t out1 = hash(in1);
67 uint32_t out2 = hash(in2);
68 const uint32_t unique_mask = (UINT32_C(1) << min_unique) - 1;
70 for (ofs = 0; ofs < 32 - min_unique; ofs++) {
71 uint32_t bits1 = (out1 >> ofs) & unique_mask;
72 uint32_t bits2 = (out2 >> ofs) & unique_mask;
74 printf("Partial collision for '%s':\n", name);
75 printf("%s(%08"PRIx32") = %08"PRIx32"\n", name, in1, out1);
76 printf("%s(%08"PRIx32") = %08"PRIx32"\n", name, in2, out2);
77 printf("%d bits of output starting at bit %d "
78 "are both 0x%"PRIx32"\n", min_unique, ofs, bits1);
87 check_3word_hash(uint32_t (*hash)(const uint32_t[], size_t, uint32_t),
92 for (i = 0; i <= 96; i++) {
93 for (j = i + 1; j <= 96; j++) {
94 uint32_t in0[3], in1[3], in2[3];
95 uint32_t out0,out1, out2;
96 const int min_unique = 12;
97 const uint32_t unique_mask = (UINT32_C(1) << min_unique) - 1;
102 out0 = hash(in0, 3, 0);
103 out1 = hash(in1, 3, 0);
104 out2 = hash(in2, 3, 0);
107 printf("%s hash not the same for non-64 aligned data "
108 "%08"PRIx32" != %08"PRIx32"\n", name, out0, out1);
110 if ((out1 & unique_mask) == (out2 & unique_mask)) {
111 printf("%s has a partial collision:\n", name);
112 printf("hash(1 << %d) == %08"PRIx32"\n", i, out1);
113 printf("hash(1 << %d) == %08"PRIx32"\n", j, out2);
114 printf("The low-order %d bits of output are both "
115 "0x%"PRIx32"\n", min_unique, out1 & unique_mask);
122 test_hash_main(int argc OVS_UNUSED, char *argv[] OVS_UNUSED)
124 /* Check that all hashes computed with hash_words with one 1-bit (or no
125 * 1-bits) set within a single 32-bit word have different values in all
126 * 11-bit consecutive runs.
128 * Given a random distribution, the probability of at least one collision
129 * in any set of 11 bits is approximately
131 * 1 - (proportion of same_bits)
132 * **(binomial_coefficient(n_bits_in_data + 1, 2))
133 * == 1 - ((2**11 - 1)/2**11)**C(33,2)
134 * == 1 - (2047/2048)**528
137 * There are 21 ways to pick 11 consecutive bits in a 32-bit word, so if we
138 * assumed independence then the chance of having no collisions in any of
139 * those 11-bit runs would be (1-0.22)**21 =~ .0044. Obviously
140 * independence must be a bad assumption :-)
142 check_word_hash(hash_words_cb, "hash_words", 11);
143 check_word_hash(jhash_words_cb, "jhash_words", 11);
145 /* Check that all hash functions of with one 1-bit (or no 1-bits) set
146 * within three 32-bit words have different values in their lowest 12
149 * Given a random distribution, the probability of at least one collision
150 * in 12 bits is approximately
152 * 1 - ((2**12 - 1)/2**12)**C(97,2)
153 * == 1 - (4095/4096)**4656
156 * so we are doing pretty well to not have any collisions in 12 bits.
158 check_3word_hash(hash_words, "hash_words");
159 check_3word_hash(jhash_words, "jhash_words");
161 /* Check that all hashes computed with hash_int with one 1-bit (or no
162 * 1-bits) set within a single 32-bit word have different values in all
163 * 12-bit consecutive runs.
165 * Given a random distribution, the probability of at least one collision
166 * in any set of 12 bits is approximately
168 * 1 - ((2**12 - 1)/2**12)**C(33,2)
169 * == 1 - (4,095/4,096)**528
172 * There are 20 ways to pick 12 consecutive bits in a 32-bit word, so if we
173 * assumed independence then the chance of having no collisions in any of
174 * those 12-bit runs would be (1-0.12)**20 =~ 0.078. This refutes our
175 * assumption of independence, which makes it seem like a good hash
178 check_word_hash(hash_int_cb, "hash_int", 12);
181 OVSTEST_REGISTER("test-hash", test_hash_main);