#include <stdio.h> #include <stdlib.h> #include <assert.h> typedef signed int Int; typedef unsigned int UInt; typedef unsigned long long int Addr64; typedef unsigned char UChar; typedef unsigned long int UWord; static inline UInt ROL32 ( UInt x, UInt n ) { assert(n != 0); n &= 31; x = (x << n) | (x >> (32-n)); return x; } ////////////////////////////////////////////////////////// typedef struct { Addr64 ga; Int nbytes; UChar* bytes; UChar* actual; } GuestBytes; GuestBytes* read_one ( FILE* f ) { Int r; UInt i; UInt esum, csum; GuestBytes* gb = malloc(sizeof(GuestBytes)); assert(gb); if (feof(f)) return NULL; assert(!ferror(f)); r= fscanf(f, "GuestBytes %llx %d ", &gb->ga, &gb->nbytes); if (0) printf("r = %d\n", r); assert(r == 2); assert(gb->ga != 0); assert(gb->nbytes > 0); assert(gb->nbytes < 5000); // let's say Int nToAlloc = gb->nbytes + (gb->ga & 3); gb->bytes = malloc( gb->nbytes + nToAlloc); gb->actual = gb->bytes + (gb->ga & 3); assert(gb->bytes); csum = 0; for (i = 0; i < gb->nbytes; i++) { UInt b; r= fscanf(f, "%02x ", &b); assert(r == 1); gb->actual[i] = b; csum = (csum << 1) ^ b; } r= fscanf(f, " %08x\n", &esum); assert(r == 1); assert(esum == csum); return gb; } ////////////////////////////////////////////////////////// void apply_to_all ( FILE* f, void(*fn)( GuestBytes*, void* ), void* opaque ) { while (!feof(f)) { GuestBytes* gb = read_one(f); if (0) printf("got %llu %d\n", gb->ga, gb->nbytes); fn( gb, opaque ); free(gb->bytes); free(gb); } } ////////////////////////////////////////////////////////// UInt hash_const_zero ( GuestBytes* gb ) { return 0; } UInt hash_sum ( GuestBytes* gb ) { UInt i, sum = 0; for (i = 0; i < gb->nbytes; i++) sum += (UInt)gb->actual[i]; return sum; } UInt hash_rol ( GuestBytes* gb ) { UInt i, sum = 0; for (i = 0; i < gb->nbytes; i++) { sum ^= (UInt)gb->actual[i]; sum = ROL32(sum,7); } return sum; } static UInt cand0 ( GuestBytes* gb ) { UWord addr = (UWord)gb->actual; UWord len = gb->nbytes; UInt sum = 0; /* pull up to 4-alignment */ while ((addr & 3) != 0 && len >= 1) { UChar* p = (UChar*)addr; sum = (sum << 8) | (UInt)p[0]; addr++; len--; } /* vectorised + unrolled */ while (len >= 16) { UInt* p = (UInt*)addr; sum = ROL32(sum ^ p[0], 13); sum = ROL32(sum ^ p[1], 13); sum = ROL32(sum ^ p[2], 13); sum = ROL32(sum ^ p[3], 13); addr += 16; len -= 16; } /* vectorised fixup */ while (len >= 4) { UInt* p = (UInt*)addr; sum = ROL32(sum ^ p[0], 13); addr += 4; len -= 4; } /* scalar fixup */ while (len >= 1) { UChar* p = (UChar*)addr; sum = ROL32(sum ^ (UInt)p[0], 19); addr++; len--; } return sum; } static UInt cand1 ( GuestBytes* gb ) { UWord addr = (UWord)gb->actual; UWord len = gb->nbytes; UInt sum1 = 0, sum2 = 0; /* pull up to 4-alignment */ while ((addr & 3) != 0 && len >= 1) { UChar* p = (UChar*)addr; sum1 = (sum1 << 8) | (UInt)p[0]; addr++; len--; } /* vectorised + unrolled */ while (len >= 16) { UInt* p = (UInt*)addr; UInt w; w = p[0]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; w = p[1]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; w = p[2]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; w = p[3]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; addr += 16; len -= 16; sum1 ^= sum2; } /* vectorised fixup */ while (len >= 4) { UInt* p = (UInt*)addr; UInt w = p[0]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; addr += 4; len -= 4; sum1 ^= sum2; } /* scalar fixup */ while (len >= 1) { UChar* p = (UChar*)addr; UInt w = (UInt)p[0]; sum1 = ROL32(sum1 ^ w, 31); sum2 += w; addr++; len--; } return sum1 + sum2; } static UInt adler32 ( GuestBytes* gb ) { UWord addr = (UWord)gb->actual; UWord len = gb->nbytes; UInt s1 = 1; UInt s2 = 0; UChar* buf = (UChar*)addr; while (len >= 4) { s1 += buf[0]; s2 += s1; s1 += buf[1]; s2 += s1; s1 += buf[2]; s2 += s1; s1 += buf[3]; s2 += s1; buf += 4; len -= 4; } while (len > 0) { s1 += buf[0]; s2 += s1; len--; buf++; } return (s2 << 16) + s1; } ////////////////////////////////////////////////////////// UInt (*theFn)(GuestBytes*) = //hash_const_zero; //hash_sum; //hash_rol; //cand0; cand1; //adler32; Int cmp_UInt_ps ( UInt* p1, UInt* p2 ) { if (*p1 < *p2) return -1; if (*p1 > *p2) return 1; return 0; } Int nSetBits ( UInt w ) { Int i, j; j = 0; for (i = 0; i < 32; i++) if (w & (1<<i)) j++; return j; } Int toc_nblocks = 0; Int toc_nblocks_with_zero = 0; double toc_sum_of_avgs = 0.0; void invertBit ( UChar* b, UInt ix, UInt bix ) { b[ix] ^= (1 << bix); } void try_onebit_changes( GuestBytes* gb, void* opaque ) { toc_nblocks++; /* collect up the hash values for all one bit changes of the key, and also that for the unmodified key. Then compute the number of changed bits for all of them. */ UInt hashIx = 0; UInt nHashes = 8 * gb->nbytes; UInt* hashes = malloc( nHashes * sizeof(UInt) ); UInt byteIx, bitIx; UInt hInit, hFinal, hRunning; Int dist, totDist = 0, nNoDist = 0; assert(hashes); hInit = theFn( gb ); for (byteIx = 0; byteIx < gb->nbytes; byteIx++) { for (bitIx = 0; bitIx < 8; bitIx++) { invertBit(gb->actual, byteIx, bitIx); //invertBit(gb->actual, byteIx, bitIx ^ 4); hRunning = theFn( gb ); dist = nSetBits(hRunning ^ hInit); totDist += dist; if (dist == 0) nNoDist++; hashes[hashIx++] = hRunning; invertBit(gb->actual, byteIx, bitIx); //invertBit(gb->actual, byteIx, bitIx ^ 4); if (0) printf(" %02d.%d %08x %d\n", byteIx, bitIx, hRunning ^ hInit, dist); } } hFinal = theFn( gb ); assert(hFinal == hInit); assert(hashIx == nHashes); if (nNoDist > 0) printf("%4d measurements, %5.2f avg dist, %2d zeroes\n", (Int)nHashes, (double)totDist / (double)nHashes, nNoDist); else printf("%4d measurements, %5.2f avg dist\n", (Int)nHashes, (double)totDist / (double)nHashes); if (nNoDist > 0) toc_nblocks_with_zero++; toc_sum_of_avgs += (double)totDist / (double)nHashes; free(hashes); } ////////////////////////////////////////////////////////// int main ( void ) { FILE* f = stdin; apply_to_all(f, try_onebit_changes, NULL); printf("\n%d blocks, %d with a zero, %5.2f avg avg\n\n", toc_nblocks, toc_nblocks_with_zero, toc_sum_of_avgs / (double)toc_nblocks ); return 0; } //////////////////////////////////////////////////////////